Data Pre-processing

Load needed libraries

library(fastDummies)
library(readr)
library(ggplot2)
library(dplyr)
library(caret)
library(glmnet)
library(boot)
library(tree)
library(ranger)
library(xgboost)
library(gbm)
library(vip)
library(ISLR)

Set the seed for reproducibility

set.seed(1)

Load the dataset

original_lc_data <- read.csv("LCdata.csv",sep = ";")
lc_data <- original_lc_data

Remove the attributes that are not available at prediction time

# Drop the attributes that are not available at prediction time
# (payment history, recoveries, loan outcome, ...). All rows are kept.
lc_data <- select(
  lc_data,
  -all_of(c(
    "collection_recovery_fee", "installment", "issue_d",
    "last_pymnt_amnt", "last_pymnt_d", "loan_status",
    "next_pymnt_d", "out_prncp", "out_prncp_inv",
    "pymnt_plan", "recoveries",
    "term", "total_pymnt",
    "total_pymnt_inv", "total_rec_int", "total_rec_late_fee",
    "total_rec_prncp"
  ))
)
summary(lc_data)
       id             member_id          loan_amnt      funded_amnt    funded_amnt_inv    int_rate    
 Min.   :   54734   Min.   :   70473   Min.   :  500   Min.   :  500   Min.   :    0   Min.   : 5.32  
 1st Qu.: 9207230   1st Qu.:10877939   1st Qu.: 8000   1st Qu.: 8000   1st Qu.: 8000   1st Qu.: 9.99  
 Median :34433372   Median :37095300   Median :13000   Median :13000   Median :13000   Median :12.99  
 Mean   :32463636   Mean   :35000265   Mean   :14754   Mean   :14741   Mean   :14702   Mean   :13.24  
 3rd Qu.:54900100   3rd Qu.:58470266   3rd Qu.:20000   3rd Qu.:20000   3rd Qu.:20000   3rd Qu.:16.20  
 Max.   :68617057   Max.   :73544841   Max.   :35000   Max.   :35000   Max.   :35000   Max.   :28.99  
                                                                                                      
  emp_title          emp_length        home_ownership       annual_inc      verification_status     url           
 Length:798641      Length:798641      Length:798641      Min.   :      0   Length:798641       Length:798641     
 Class :character   Class :character   Class :character   1st Qu.:  45000   Class :character    Class :character  
 Mode  :character   Mode  :character   Mode  :character   Median :  65000   Mode  :character    Mode  :character  
                                                          Mean   :  75014                                         
                                                          3rd Qu.:  90000                                         
                                                          Max.   :9500000                                         
                                                          NA's   :4                                               
     desc             purpose             title             zip_code          addr_state             dti         
 Length:798641      Length:798641      Length:798641      Length:798641      Length:798641      Min.   :   0.00  
 Class :character   Class :character   Class :character   Class :character   Class :character   1st Qu.:  11.91  
 Mode  :character   Mode  :character   Mode  :character   Mode  :character   Mode  :character   Median :  17.66  
                                                                                                Mean   :  18.16  
                                                                                                3rd Qu.:  23.95  
                                                                                                Max.   :9999.00  
                                                                                                                 
  delinq_2yrs      earliest_cr_line   inq_last_6mths    mths_since_last_delinq mths_since_last_record
 Min.   : 0.0000   Length:798641      Min.   : 0.0000   Min.   :  0.0          Min.   :  0.0         
 1st Qu.: 0.0000   Class :character   1st Qu.: 0.0000   1st Qu.: 15.0          1st Qu.: 51.0         
 Median : 0.0000   Mode  :character   Median : 0.0000   Median : 31.0          Median : 70.0         
 Mean   : 0.3145                      Mean   : 0.6947   Mean   : 34.1          Mean   : 70.1         
 3rd Qu.: 0.0000                      3rd Qu.: 1.0000   3rd Qu.: 50.0          3rd Qu.: 92.0         
 Max.   :39.0000                      Max.   :33.0000   Max.   :188.0          Max.   :129.0         
 NA's   :25                           NA's   :25        NA's   :408818         NA's   :675190        
    open_acc        pub_rec          revol_bal         revol_util       total_acc      initial_list_status
 Min.   : 0.00   Min.   : 0.0000   Min.   :      0   Min.   :  0.00   Min.   :  1.00   Length:798641      
 1st Qu.: 8.00   1st Qu.: 0.0000   1st Qu.:   6443   1st Qu.: 37.70   1st Qu.: 17.00   Class :character   
 Median :11.00   Median : 0.0000   Median :  11876   Median : 56.00   Median : 24.00   Mode  :character   
 Mean   :11.55   Mean   : 0.1953   Mean   :  16930   Mean   : 55.05   Mean   : 25.27                      
 3rd Qu.:14.00   3rd Qu.: 0.0000   3rd Qu.:  20839   3rd Qu.: 73.50   3rd Qu.: 32.00                      
 Max.   :90.00   Max.   :63.0000   Max.   :2904836   Max.   :892.30   Max.   :169.00                      
 NA's   :25      NA's   :25        NA's   :2         NA's   :454      NA's   :25                          
 last_credit_pull_d collections_12_mths_ex_med mths_since_last_major_derog  policy_code application_type  
 Length:798641      Min.   : 0.00000           Min.   :  0.0               Min.   :1    Length:798641     
 Class :character   1st Qu.: 0.00000           1st Qu.: 27.0               1st Qu.:1    Class :character  
 Mode  :character   Median : 0.00000           Median : 44.0               Median :1    Mode  :character  
                    Mean   : 0.01447           Mean   : 44.1               Mean   :1                      
                    3rd Qu.: 0.00000           3rd Qu.: 61.0               3rd Qu.:1                      
                    Max.   :20.00000           Max.   :188.0               Max.   :1                      
                    NA's   :126                NA's   :599107                                             
 annual_inc_joint   dti_joint      verification_status_joint acc_now_delinq       tot_coll_amt    
 Min.   : 17950   Min.   : 3.0     Length:798641             Min.   : 0.000000   Min.   :      0  
 1st Qu.: 76167   1st Qu.:13.3     Class :character          1st Qu.: 0.000000   1st Qu.:      0  
 Median :101886   Median :17.7     Mode  :character          Median : 0.000000   Median :      0  
 Mean   :110745   Mean   :18.4                               Mean   : 0.005026   Mean   :    228  
 3rd Qu.:133000   3rd Qu.:22.6                               3rd Qu.: 0.000000   3rd Qu.:      0  
 Max.   :500000   Max.   :43.9                               Max.   :14.000000   Max.   :9152545  
 NA's   :798181   NA's   :798183                             NA's   :25          NA's   :63276    
  tot_cur_bal       open_acc_6m       open_il_6m      open_il_12m      open_il_24m     mths_since_rcnt_il
 Min.   :      0   Min.   : 0.0     Min.   : 0.0     Min.   : 0.0     Min.   : 0.0     Min.   :  0.0     
 1st Qu.:  29861   1st Qu.: 0.0     1st Qu.: 1.0     1st Qu.: 0.0     1st Qu.: 0.0     1st Qu.:  6.0     
 Median :  80647   Median : 1.0     Median : 2.0     Median : 0.0     Median : 1.0     Median : 12.0     
 Mean   : 139508   Mean   : 1.1     Mean   : 2.9     Mean   : 0.8     Mean   : 1.7     Mean   : 21.1     
 3rd Qu.: 208229   3rd Qu.: 2.0     3rd Qu.: 4.0     3rd Qu.: 1.0     3rd Qu.: 2.0     3rd Qu.: 23.0     
 Max.   :8000078   Max.   :14.0     Max.   :33.0     Max.   :12.0     Max.   :19.0     Max.   :363.0     
 NA's   :63276     NA's   :779525   NA's   :779525   NA's   :779525   NA's   :779525   NA's   :780030    
  total_bal_il       il_util        open_rv_12m      open_rv_24m       max_bal_bc        all_util     
 Min.   :     0   Min.   :  0.0    Min.   : 0.0     Min.   : 0       Min.   :    0    Min.   :  0.0   
 1st Qu.: 10164   1st Qu.: 58.4    1st Qu.: 0.0     1st Qu.: 1       1st Qu.: 2406    1st Qu.: 47.6   
 Median : 24544   Median : 74.8    Median : 1.0     Median : 2       Median : 4502    Median : 61.9   
 Mean   : 36428   Mean   : 71.5    Mean   : 1.4     Mean   : 3       Mean   : 5878    Mean   : 60.8   
 3rd Qu.: 47640   3rd Qu.: 87.7    3rd Qu.: 2.0     3rd Qu.: 4       3rd Qu.: 7774    3rd Qu.: 75.2   
 Max.   :878459   Max.   :223.3    Max.   :22.0     Max.   :43       Max.   :83047    Max.   :151.4   
 NA's   :779525   NA's   :782007   NA's   :779525   NA's   :779525   NA's   :779525   NA's   :779525  
 total_rev_hi_lim      inq_fi        total_cu_tl      inq_last_12m   
 Min.   :      0   Min.   : 0.0     Min.   : 0.0     Min.   :-4      
 1st Qu.:  13900   1st Qu.: 0.0     1st Qu.: 0.0     1st Qu.: 0      
 Median :  23700   Median : 0.0     Median : 0.0     Median : 2      
 Mean   :  32093   Mean   : 0.9     Mean   : 1.5     Mean   : 2      
 3rd Qu.:  39800   3rd Qu.: 1.0     3rd Qu.: 2.0     3rd Qu.: 3      
 Max.   :9999999   Max.   :16.0     Max.   :35.0     Max.   :32      
 NA's   :63276     NA's   :779525   NA's   :779525   NA's   :779525  

First we delete the columns which aren’t useful for our prediction

# Identifier-like columns carry no predictive signal: remove them in one step.
lc_data[c("id", "member_id", "zip_code", "url")] <- list(NULL)

Looks like policy_code contains just value equal to 1, it can be removed

lc_data$policy_code <- NULL

Remove additional columns which are related to the historical data

lc_data$last_credit_pull_d <- NULL

Then we delete the columns which can’t be converted to categorical and require NLP

# Free-text columns would need NLP to be usable: remove them in one step.
lc_data[c("title", "desc", "emp_title")] <- list(NULL)

let’s examine the loan_amnt column

sum(is.na(lc_data$loan_amnt))
[1] 0
cor(lc_data$loan_amnt, lc_data$int_rate)
[1] 0.1447189
hist(lc_data$loan_amnt, breaks = 20, main = "loan_amnt distribution", xlab = "loan_amnt", col = "lightblue", border = "black")

# Both int_rate and loan_amnt are continuous. Without an explicit grouping,
# geom_boxplot() collapses every row into a single box, so bin int_rate into
# 1-point-wide intervals and draw one box of loan_amnt per interval.
ggplot(data = lc_data, mapping = aes(x = int_rate, y = loan_amnt)) +
  geom_boxplot(aes(group = cut_width(int_rate, 1)))

standardize loan_amnt

#lc_data$loan_amnt <- scale(lc_data$loan_amnt)

let’s examine the funded_amnt column

sum(is.na(lc_data$funded_amnt))
[1] 0
cor(lc_data$funded_amnt, lc_data$int_rate)
[1] 0.1448634
hist(lc_data$funded_amnt, breaks = 20, main = "funded_amnt distribution", xlab = "funded_amnt", col = "lightblue", border = "black")

as we can see, funded_amnt is almost the same as the loan_amnt column, consequently, we remove it.

lc_data$funded_amnt <- NULL 

let’s examine the funded_amnt_inv column

sum(is.na(lc_data$funded_amnt_inv))
[1] 0
cor(lc_data$funded_amnt_inv, lc_data$int_rate)
[1] 0.1449083
hist(lc_data$funded_amnt_inv, breaks = 20, main = "funded_amnt_inv distribution", xlab = "funded_amnt_inv", col = "lightblue", border = "black")

remove funded_amnt_inv for the same reason as above

lc_data$funded_amnt_inv <- NULL

let’s see the int_rate distribution.

hist(lc_data$int_rate, breaks = 20, main = "int_rate distribution", xlab = "int_rate", col = "lightblue", border = "black")

Standardize int rate:

#lc_data$int_rate <- scale(lc_data$int_rate)

we delete the emp_title column as there are several entries for the same job title and because there are too many different values for one-hot encoding. In addition, some titles are unclear (NLP required)

# emp_title has already been removed from lc_data, so lc_data$emp_title is
# NULL and would always count 0 distinct values. Count the titles on the
# untouched copy of the raw data instead.
n_distinct(original_lc_data$emp_title)
[1] 0

As we can observe, there are 40363 NAs. We can assume that these 40363 applicants do not work.

# Frequency of each emp_length category.
barplot(table(lc_data$emp_length),
        xlab = "emp_length years", 
        ylab = "Frequency", 
        col = "skyblue", 
        border = "black",
        cex.names = 0.6)  # shrink the bar (category) labels drawn on the axis

Since emp_length appears to be categorical, we first convert it to a factor and then to a numeric code. The conversion to numeric is needed to support XGBoost.

# Treat emp_length as categorical so the boxplot shows one box per category.
lc_data$emp_length <- factor(lc_data$emp_length)
ggplot(lc_data, aes(x = int_rate, y = emp_length)) +
  geom_boxplot()

# Replace each category by its integer level code.
# NOTE(review): factor levels are sorted alphabetically by default, so the
# codes may not follow the length of employment - verify before treating
# this column as ordinal.
lc_data$emp_length <- as.numeric(lc_data$emp_length)

Cleaning of home_ownership:

During the data cleaning phase, our analysis revealed that the variable “home_ownership” does not show a distinct correlation with interest rates. Specifically, the categories “ANY” and “OTHER” contain 2 and 155 cases, respectively, while the “NONE” category comprises 45 cases. Although the “NONE” category appears to have a higher interest rate than the others, the limited sample size of 45 cases raises doubts about the reliability of this observation. Notably, the “NONE” category might pertain to individuals experiencing homelessness, which raises ethical concerns about providing loans to this demographic.

table(lc_data$home_ownership)

     ANY MORTGAGE     NONE    OTHER      OWN     RENT 
       2   399151       45      155    78789   320499 
ggplot(data = lc_data, mapping = aes(x=int_rate,y=home_ownership)) + geom_boxplot()

Then, we retain mortgage, own and rent:

# Keep only the three well-populated ownership categories, then replace
# each category by its integer level code.
lc_data <- filter(lc_data, home_ownership %in% c("MORTGAGE", "OWN", "RENT"))
lc_data$home_ownership <- as.numeric(factor(lc_data$home_ownership))

application joint handling


# Merge the individual and joint figures: whenever a joint value is present it
# takes precedence, otherwise the individual value is used.
lc_data <- lc_data %>%
  mutate(
    # merged annual income
    annual_inc_merged = ifelse(is.na(annual_inc_joint), annual_inc, annual_inc_joint),
    # merged debt to income ratio
    dti_merged = ifelse(is.na(dti_joint), dti, dti_joint)
  ) %>%
  # the source columns are no longer needed once merged
  select(-annual_inc, -annual_inc_joint, -dti, -dti_joint)

Upon reviewing the summary again, it becomes apparent that there are merely 460 joint applications, constituting a small subset within the extensive dataset of around 800k rows. Through consolidating the debt-to-income ratios (dti’s), we can pinpoint the data pertinent to our research objectives. Hence, it is advisable to eliminate the columns verification_status_joint and application_type to prevent introducing unwarranted variability into our analysis.

table(lc_data$verification_status)

   Not Verified Source Verified        Verified 
         240255          296631          261553 
table(lc_data$verification_status_joint)

                   Not Verified Source Verified        Verified 
         797979             253              53             154 
# Replace each verification status by its integer level code and drop the
# joint-application columns.
lc_data$verification_status <- as.numeric(factor(lc_data$verification_status))
lc_data <- select(lc_data, -c(verification_status_joint, application_type))

Let’s check whether “other” in purpose is a placeholder for NA or a real value. It is a real value, so we don’t have to handle it.

# Treat purpose as categorical so the boxplot shows one box per purpose.
lc_data$purpose <- factor(lc_data$purpose)
ggplot(lc_data, aes(x = int_rate, y = purpose)) +
  geom_boxplot()

# Replace each purpose by its integer level code.
lc_data$purpose <- as.numeric(lc_data$purpose)

Let’s take a look at the borrower’s state (addr_state):

table(lc_data$addr_state)

    AK     AL     AR     AZ     CA     CO     CT     DC     DE     FL     GA     HI     IA     ID     IL     IN 
  1992  10101   5953  18359 116578  16934  12154   2188   2268  54819  26146   4112     13     11  31880  12393 
    KS     KY     LA     MA     MD     ME     MI     MN     MO     MS     MT     NC     ND     NE     NH     NJ 
  7105   7726   9498  18546  18906    469  20678  14306  12821   3455   2286  22135    431   1064   3865  29991 
    NM     NV     NY     OH     OK     OR     PA     RI     SC     SD     TN     TX     UT     VA     VT     WA 
  4428  11155  66790  26682   7266   9806  28221   3499   9609   1615  11618  63982   5629  23616   1606  17470 
    WI     WV     WY 
 10446   3977   1841 
# Treat addr_state as categorical so the boxplot shows one box per state.
lc_data$addr_state <- factor(lc_data$addr_state)
ggplot(lc_data, aes(x = int_rate, y = addr_state)) +
  geom_boxplot()

# Replace each state by its integer level code.
lc_data$addr_state <- as.numeric(lc_data$addr_state)

Regarding delinquencies in the last 2 years (delinq_2yrs), there are only a few NAs, so we remove those rows:

# Keep only the rows where delinq_2yrs is known.
lc_data <- filter(lc_data, !is.na(delinq_2yrs))
# Bucket a "months since event" vector into yearly recency categories.
#
# months: numeric vector of months; NA entries are mapped to "NONE".
# Returns a character vector of the same length containing "NONE",
# "Less_1_Y" (<= 12), "Less_2_Y" (<= 24), "Less_3_Y" (<= 36),
# "Less_4_Y" (<= 48) or "More_4_Y" (> 48).
months_to_recency_bucket <- function(months) {
  # cut() uses right-closed intervals by default, i.e. (-Inf, 12], (12, 24], ...
  bucket <- as.character(cut(
    months,
    breaks = c(-Inf, 12, 24, 36, 48, Inf),
    labels = c("Less_1_Y", "Less_2_Y", "Less_3_Y", "Less_4_Y", "More_4_Y")
  ))
  bucket[is.na(months)] <- "NONE"
  bucket
}

# Months since the last delinquency: bucket, plot per bucket, then replace
# each bucket by its integer level code.
lc_data <- lc_data %>%
  mutate(mths_since_delinq_cat = months_to_recency_bucket(mths_since_last_delinq)) %>%
  select(-mths_since_last_delinq)

lc_data$mths_since_delinq_cat <- as.factor(lc_data$mths_since_delinq_cat)
ggplot(data = lc_data, mapping = aes(x = int_rate, y = mths_since_delinq_cat)) +
  geom_boxplot()

lc_data$mths_since_delinq_cat <- as.numeric(lc_data$mths_since_delinq_cat)

# Months since the last public record: same treatment.
lc_data <- lc_data %>%
  mutate(mths_since_last_record_cat = months_to_recency_bucket(mths_since_last_record)) %>%
  select(-mths_since_last_record)

lc_data$mths_since_last_record_cat <- as.factor(lc_data$mths_since_last_record_cat)
ggplot(data = lc_data, mapping = aes(x = int_rate, y = mths_since_last_record_cat)) +
  geom_boxplot()

lc_data$mths_since_last_record_cat <- as.numeric(lc_data$mths_since_last_record_cat)

# Months since the last major derogatory mark: same treatment.
lc_data <- lc_data %>%
  mutate(mths_since_last_major_derog_cat = months_to_recency_bucket(mths_since_last_major_derog)) %>%
  select(-mths_since_last_major_derog)

lc_data$mths_since_last_major_derog_cat <- as.factor(lc_data$mths_since_last_major_derog_cat)
ggplot(data = lc_data, mapping = aes(x = int_rate, y = mths_since_last_major_derog_cat)) +
  geom_boxplot()

lc_data$mths_since_last_major_derog_cat <- as.numeric(lc_data$mths_since_last_major_derog_cat)
# Treat initial_list_status as categorical so the boxplot shows one box per status.
lc_data$initial_list_status <- factor(lc_data$initial_list_status)
ggplot(lc_data, aes(x = int_rate, y = initial_list_status)) +
  geom_boxplot()

# Replace each status by its integer level code.
lc_data$initial_list_status <- as.numeric(lc_data$initial_list_status)

Let’s check which columns still have null values

colSums(is.na(lc_data))
                      loan_amnt                        int_rate                      emp_length 
                              0                               0                               0 
                 home_ownership             verification_status                         purpose 
                              0                               0                               0 
                     addr_state                     delinq_2yrs                earliest_cr_line 
                              0                               0                               0 
                 inq_last_6mths                        open_acc                         pub_rec 
                              0                               0                               0 
                      revol_bal                      revol_util                       total_acc 
                              2                             428                               0 
            initial_list_status      collections_12_mths_ex_med                  acc_now_delinq 
                              0                              99                               0 
                   tot_coll_amt                     tot_cur_bal                     open_acc_6m 
                          63132                           63132                          779302 
                     open_il_6m                     open_il_12m                     open_il_24m 
                         779302                          779302                          779302 
             mths_since_rcnt_il                    total_bal_il                         il_util 
                         779807                          779302                          781784 
                    open_rv_12m                     open_rv_24m                      max_bal_bc 
                         779302                          779302                          779302 
                       all_util                total_rev_hi_lim                          inq_fi 
                         779302                           63132                          779302 
                    total_cu_tl                    inq_last_12m               annual_inc_merged 
                         779302                          779302                               0 
                     dti_merged           mths_since_delinq_cat      mths_since_last_record_cat 
                              0                               0                               0 
mths_since_last_major_derog_cat 
                              0 

The columns revol_bal and revol_util contain only a few NA values. Those values can’t be replaced with 0, so we keep only the rows in which both columns are not NA.

# Keep only the rows where both revol_bal and revol_util are known.
lc_data <- filter(lc_data, !is.na(revol_bal), !is.na(revol_util))

Let’s check which columns still have null values

names(which(colSums(is.na(lc_data)) > 0))
 [1] "collections_12_mths_ex_med" "tot_coll_amt"               "tot_cur_bal"               
 [4] "open_acc_6m"                "open_il_6m"                 "open_il_12m"               
 [7] "open_il_24m"                "mths_since_rcnt_il"         "total_bal_il"              
[10] "il_util"                    "open_rv_12m"                "open_rv_24m"               
[13] "max_bal_bc"                 "all_util"                   "total_rev_hi_lim"          
[16] "inq_fi"                     "total_cu_tl"                "inq_last_12m"              

Replace null values with 0 where possible

# Columns whose missing values are replaced by 0.
# NOTE(review): 0 is also an observed value for mths_since_rcnt_il, il_util
# and all_util, so "missing" and "zero" become indistinguishable there -
# confirm that this is acceptable.
zero_fill_cols <- c(
  "open_acc_6m", "tot_cur_bal", "open_il_6m", "open_il_12m", "open_il_24m",
  "mths_since_rcnt_il", "total_bal_il", "il_util", "open_rv_12m",
  "total_rev_hi_lim", "max_bal_bc", "all_util", "inq_fi", "total_cu_tl",
  "inq_last_12m", "open_rv_24m", "tot_coll_amt", "collections_12_mths_ex_med"
)

# Apply the same NA -> 0 replacement to every listed column; column positions
# in lc_data are unchanged.
lc_data[zero_fill_cols] <- lapply(
  lc_data[zero_fill_cols],
  function(column) ifelse(is.na(column), 0, column)
)

earliest_cr_line contains the month in which the borrower’s earliest reported credit line was opened. Even though this date consists only of a month and a year, there are still too many unique values. We can transform the dates into numerical values by converting them to Unix time, which measures time as the number of seconds elapsed since 00:00:00 UTC on 1 January 1970. Since this column doesn’t contain the day of the month, we take the first day of the month as the reference.

# Keep only the rows where earliest_cr_line is known.
lc_data <- filter(lc_data, !is.na(earliest_cr_line))

# Convert month-year strings to Unix time.
#
# date: character vector in "%b-%Y" form (abbreviated month name, 4-digit year).
# Returns the number of seconds since 1970-01-01 00:00:00 UTC for the first
# day of each month.
to_unix_time <- function(date) {
  first_of_month <- paste0("01-", date)
  as.numeric(as.POSIXct(first_of_month, format = "%d-%b-%Y", tz = "UTC"))
}

# map dates to unix time
# to_unix_time() is built from vectorised functions, so the whole column is
# converted in one call. apply() over the data frame would first coerce every
# column to a character matrix and then call the function once per row.
lc_data$earliest_cr_line <- to_unix_time(lc_data$earliest_cr_line)

# standardize them
#lc_data$earliest_cr_line <- scale(lc_data$earliest_cr_line)
summary(lc_data)
   loan_amnt        int_rate       emp_length    home_ownership  verification_status    purpose      
 Min.   :  500   Min.   : 5.32   Min.   : 1.00   Min.   :1.000   Min.   :1.000       Min.   : 1.000  
 1st Qu.: 8000   1st Qu.: 9.99   1st Qu.: 3.00   1st Qu.:1.000   1st Qu.:1.000       1st Qu.: 3.000  
 Median :13000   Median :12.99   Median : 4.00   Median :2.000   Median :2.000       Median : 3.000  
 Mean   :14757   Mean   :13.24   Mean   : 5.11   Mean   :1.901   Mean   :2.027       Mean   : 3.571  
 3rd Qu.:20000   3rd Qu.:16.20   3rd Qu.: 7.00   3rd Qu.:3.000   3rd Qu.:3.000       3rd Qu.: 3.000  
 Max.   :35000   Max.   :28.99   Max.   :12.00   Max.   :3.000   Max.   :3.000       Max.   :14.000  
   addr_state     delinq_2yrs      earliest_cr_line     inq_last_6mths       open_acc        pub_rec       
 Min.   : 1.00   Min.   : 0.0000   Min.   :-820540800   Min.   : 0.0000   Min.   : 1.00   Min.   : 0.0000  
 1st Qu.:10.00   1st Qu.: 0.0000   1st Qu.: 770428800   1st Qu.: 0.0000   1st Qu.: 8.00   1st Qu.: 0.0000  
 Median :24.00   Median : 0.0000   Median : 936144000   Median : 0.0000   Median :11.00   Median : 0.0000  
 Mean   :24.14   Mean   : 0.3143   Mean   : 889273164   Mean   : 0.6947   Mean   :11.55   Mean   : 0.1954  
 3rd Qu.:37.00   3rd Qu.: 0.0000   3rd Qu.:1051747200   3rd Qu.: 1.0000   3rd Qu.:14.00   3rd Qu.: 0.0000  
 Max.   :51.00   Max.   :39.0000   Max.   :1351728000   Max.   :33.0000   Max.   :90.00   Max.   :63.0000  
   revol_bal         revol_util       total_acc      initial_list_status collections_12_mths_ex_med
 Min.   :      0   Min.   :  0.00   Min.   :  1.00   Min.   :1.000       Min.   : 0.00000          
 1st Qu.:   6450   1st Qu.: 37.70   1st Qu.: 17.00   1st Qu.:1.000       1st Qu.: 0.00000          
 Median :  11881   Median : 56.00   Median : 24.00   Median :1.000       Median : 0.00000          
 Mean   :  16934   Mean   : 55.05   Mean   : 25.27   Mean   :1.485       Mean   : 0.01448          
 3rd Qu.:  20844   3rd Qu.: 73.50   3rd Qu.: 32.00   3rd Qu.:2.000       3rd Qu.: 0.00000          
 Max.   :2904836   Max.   :892.30   Max.   :169.00   Max.   :2.000       Max.   :20.00000          
 acc_now_delinq       tot_coll_amt      tot_cur_bal       open_acc_6m         open_il_6m        open_il_12m      
 Min.   : 0.000000   Min.   :      0   Min.   :      0   Min.   : 0.00000   Min.   : 0.00000   Min.   : 0.00000  
 1st Qu.: 0.000000   1st Qu.:      0   1st Qu.:  23195   1st Qu.: 0.00000   1st Qu.: 0.00000   1st Qu.: 0.00000  
 Median : 0.000000   Median :      0   Median :  65402   Median : 0.00000   Median : 0.00000   Median : 0.00000  
 Mean   : 0.005026   Mean   :    210   Mean   : 128461   Mean   : 0.02641   Mean   : 0.06982   Mean   : 0.01816  
 3rd Qu.: 0.000000   3rd Qu.:      0   3rd Qu.: 195864   3rd Qu.: 0.00000   3rd Qu.: 0.00000   3rd Qu.: 0.00000  
 Max.   :14.000000   Max.   :9152545   Max.   :8000078   Max.   :14.00000   Max.   :33.00000   Max.   :12.00000  
  open_il_24m       mths_since_rcnt_il  total_bal_il       il_util         open_rv_12m        open_rv_24m      
 Min.   : 0.00000   Min.   :  0.0000   Min.   :     0   Min.   :  0.000   Min.   : 0.00000   Min.   : 0.00000  
 1st Qu.: 0.00000   1st Qu.:  0.0000   1st Qu.:     0   1st Qu.:  0.000   1st Qu.: 0.00000   1st Qu.: 0.00000  
 Median : 0.00000   Median :  0.0000   Median :     0   Median :  0.000   Median : 0.00000   Median : 0.00000  
 Mean   : 0.03991   Mean   :  0.4918   Mean   :   872   Mean   :  1.489   Mean   : 0.03316   Mean   : 0.07114  
 3rd Qu.: 0.00000   3rd Qu.:  0.0000   3rd Qu.:     0   3rd Qu.:  0.000   3rd Qu.: 0.00000   3rd Qu.: 0.00000  
 Max.   :19.00000   Max.   :363.0000   Max.   :878459   Max.   :223.300   Max.   :22.00000   Max.   :43.00000  
   max_bal_bc         all_util       total_rev_hi_lim      inq_fi          total_cu_tl        inq_last_12m     
 Min.   :    0.0   Min.   :  0.000   Min.   :      0   Min.   : 0.00000   Min.   : 0.00000   Min.   :-4.00000  
 1st Qu.:    0.0   1st Qu.:  0.000   1st Qu.:  11700   1st Qu.: 0.00000   1st Qu.: 0.00000   1st Qu.: 0.00000  
 Median :    0.0   Median :  0.000   Median :  21800   Median : 0.00000   Median : 0.00000   Median : 0.00000  
 Mean   :  140.8   Mean   :  1.456   Mean   :  29564   Mean   : 0.02262   Mean   : 0.03668   Mean   : 0.04733  
 3rd Qu.:    0.0   3rd Qu.:  0.000   3rd Qu.:  37900   3rd Qu.: 0.00000   3rd Qu.: 0.00000   3rd Qu.: 0.00000  
 Max.   :83047.0   Max.   :151.400   Max.   :9999999   Max.   :16.00000   Max.   :35.00000   Max.   :32.00000  
 annual_inc_merged   dti_merged    mths_since_delinq_cat mths_since_last_record_cat mths_since_last_major_derog_cat
 Min.   :   1896   Min.   : 0.00   Min.   :1.000         Min.   :1.000              Min.   :1.000                  
 1st Qu.:  45000   1st Qu.:11.91   1st Qu.:3.000         1st Qu.:6.000              1st Qu.:6.000                  
 Median :  65000   Median :17.66   Median :6.000         Median :6.000              Median :6.000                  
 Mean   :  75038   Mean   :18.13   Mean   :4.576         Mean   :5.779              Mean   :5.435                  
 3rd Qu.:  90000   3rd Qu.:23.94   3rd Qu.:6.000         3rd Qu.:6.000              3rd Qu.:6.000                  
 Max.   :9500000   Max.   :43.86   Max.   :6.000         Max.   :6.000              Max.   :6.000                  
#round(cor(lc_data),2)

# TODO: (old part), 80/20 split and linear regression...
# Create indices for splitting (80% train, 20% test)
# The partition is random, so the result depends on the RNG state at this point.
train_indices <- createDataPartition(lc_data$int_rate, p = 0.8, list = FALSE)

# Create training and testing datasets
train_data <- lc_data[train_indices, ]
test_data <- lc_data[-train_indices, ]

#### Linear Regression ####
#lm.fit <- lm(int_rate ~ ., data = train_data)

# TODO: check collinearity and multicollinearity
#vif(lm.fit) # there is multicollinearity
#cor(lc_data) 

# Make predictions on training and testing data
#train_predictions <- predict(lm.fit, newdata = train_data)
#test_predictions <- predict(lm.fit, newdata = test_data)

# Evaluate model performance on training data
#train_rmse <- sqrt(mean((train_predictions - train_data$int_rate)^2))
#train_r_squared <- summary(lm.fit)$r.squared

# Evaluate model performance on testing data
#test_rmse <- sqrt(mean((test_predictions - test_data$int_rate)^2))
#test_r_squared <- summary(lm.fit, test_data)$r.squared

# Print evaluation metrics
#cat("Training RMSE:", train_rmse, "\n")
#cat("Training R-squared:", train_r_squared, "\n")
#rmse <- sqrt(mean(lm.fit$residuals^2))
#print(rmse)
# Fraction of the train/test rows handed to the models below.
#   * 1 (default) uses every row of train_data / test_data.
#   * A value below 1 (e.g. 0.01) draws a random subsample without
#     replacement, which is useful to iterate quickly on slow models.
# Drawing a subsample and then unconditionally replacing it with the full data
# wastes work and hides which data set is actually used, so the choice is made
# explicit here.
sample_fraction <- 1

# Number of rows kept from each partition
sample_train_size <- floor(sample_fraction * nrow(train_data))
sample_test_size <- floor(sample_fraction * nrow(test_data))

if (sample_fraction < 1) {
  # Randomly select the requested share of the rows
  sampled_train_data <- train_data[sample(nrow(train_data), size = sample_train_size, replace = FALSE), ]
  sampled_test_data <- test_data[sample(nrow(test_data), size = sample_test_size, replace = FALSE), ]
} else {
  # Use the complete partitions
  sampled_train_data <- train_data
  sampled_test_data <- test_data
}

#### Linear Regression ####

# Fit a linear model of int_rate on every other column of the training data
lm.fit <- lm(int_rate ~ ., data = sampled_train_data)

# Predict on the rows used for fitting and on the test rows
lm.train_predictions <- predict(lm.fit, newdata = sampled_train_data)
lm.test_predictions <- predict(lm.fit, newdata = sampled_test_data)

# Prediction errors (predicted minus observed), reused by all metrics below
lm.train_errors <- lm.train_predictions - sampled_train_data$int_rate
lm.test_errors <- lm.test_predictions - sampled_test_data$int_rate

# Mean Squared Error (MSE)
lm.train_mse <- mean(lm.train_errors^2)
lm.test_mse <- mean(lm.test_errors^2)

# Root Mean Squared Error (RMSE)
lm.train_rmse <- sqrt(lm.train_mse)
lm.test_rmse <- sqrt(lm.test_mse)

# Mean Absolute Error (MAE)
lm.train_mae <- mean(abs(lm.train_errors))
lm.test_mae <- mean(abs(lm.test_errors))

# R-squared (R²): one minus the ratio of the squared-error sum to the total
# sum of squares around the mean of the observed values of the same data set
lm.train_r2 <- 1 - (
  sum(lm.train_errors^2) /
    sum((sampled_train_data$int_rate - mean(sampled_train_data$int_rate))^2)
)
lm.test_r2 <- 1 - (
  sum(lm.test_errors^2) /
    sum((sampled_test_data$int_rate - mean(sampled_test_data$int_rate))^2)
)

# Display the linear-regression metrics (MSE, RMSE, MAE and R² for the
# training and the testing data). In this rendered document each cat() call
# appears to be followed by the line it printed when the script was run.
cat("Training MSE:", lm.train_mse, "\n")
Training MSE: 13.26248 
cat("Testing MSE:", lm.test_mse, "\n")
Testing MSE: 13.6664 
cat("Training RMSE:", lm.train_rmse, "\n")
Training RMSE: 3.641768 
cat("Testing RMSE:", lm.test_rmse, "\n")
Testing RMSE: 3.696809 
cat("Training MAE:", lm.train_mae, "\n")
Training MAE: 2.885102 
cat("Testing MAE:", lm.test_mae, "\n")
Testing MAE: 2.889154 
cat("Training R-squared (R²):", lm.train_r2, "\n")
Training R-squared (R²): 0.3094189 
cat("Testing R-squared (R²):", lm.test_r2, "\n")
Testing R-squared (R²): 0.2880591 
#### Linear Regression with k-fold Cross Validation (k = 10) ####

# Number of folds for cross-validation
num_folds <- 10

# With its default returnTrain = FALSE, createFolds() returns for each fold the
# row positions that are HELD OUT. The model for a fold must therefore be
# fitted on all the other rows and evaluated on folds[[i]].
folds <- createFolds(sampled_train_data$int_rate, k = num_folds, list = TRUE)

# Preallocate one slot per fold for the fitted model and its metrics
models <- vector("list", length(folds))
fold_metrics <- vector("list", length(folds))
all_rows <- seq_len(nrow(sampled_train_data))

# Perform k-fold cross-validation
for (i in seq_along(folds)) {
  # Held-out rows of this fold, and the complementary rows used for fitting.
  # A fold-specific name is used for the fitting rows so that the global
  # train_indices of the 80/20 split is not overwritten.
  test_indices <- folds[[i]]
  fold_train_indices <- setdiff(all_rows, test_indices)

  train_data_fold <- sampled_train_data[fold_train_indices, ]
  test_data_fold <- sampled_train_data[test_indices, ]

  # Fit the model on the fitting rows of this fold.
  # NOTE: every stored lm object keeps its own copy of the fold's model frame,
  # so `models` can become large on the full data set.
  lm_model <- lm(int_rate ~ ., data = train_data_fold)
  models[[i]] <- lm_model

  # Predictions on the fitting rows and on the held-out rows
  train_predictions <- predict(lm_model, newdata = train_data_fold)
  test_predictions <- predict(lm_model, newdata = test_data_fold)

  # Metrics on the fitting rows
  train_mse <- mean((train_predictions - train_data_fold$int_rate)^2)
  train_rmse <- sqrt(train_mse)
  train_mae <- mean(abs(train_predictions - train_data_fold$int_rate))
  train_r2 <- summary(lm_model)$r.squared

  # Metrics on the held-out rows
  test_mse <- mean((test_predictions - test_data_fold$int_rate)^2)
  test_rmse <- sqrt(test_mse)
  test_mae <- mean(abs(test_predictions - test_data_fold$int_rate))
  test_r2 <- 1 - (
    sum((test_data_fold$int_rate - test_predictions)^2) /
      sum((test_data_fold$int_rate - mean(test_data_fold$int_rate))^2)
  )

  # One-row summary for this fold
  fold_metrics[[i]] <- data.frame(
    Fold = i,
    Train_MSE = train_mse, Test_MSE = test_mse,
    Train_RMSE = train_rmse, Test_RMSE = test_rmse,
    Train_MAE = train_mae, Test_MAE = test_mae,
    Train_R2 = train_r2, Test_R2 = test_r2
  )
}

# Combine the per-fold summaries into a single data frame (one row per fold)
results <- do.call(rbind, fold_metrics)

# Print every model stored in `models`, one list element per cross-validation
# fold; for each lm fit this shows its call and its coefficients
print(models)
[[1]]

Call:
lm(formula = int_rate ~ ., data = train_data_fold)

Coefficients:
                    (Intercept)                        loan_amnt                       emp_length  
                      6.335e+00                        1.261e-04                        1.064e-02  
                 home_ownership              verification_status                          purpose  
                      1.931e-01                        8.601e-01                        3.559e-01  
                     addr_state                      delinq_2yrs                 earliest_cr_line  
                      2.676e-03                        4.429e-02                        2.146e-09  
                 inq_last_6mths                         open_acc                          pub_rec  
                      9.875e-01                        6.126e-02                        4.337e-01  
                      revol_bal                       revol_util                        total_acc  
                      8.094e-06                        4.396e-02                       -3.199e-02  
            initial_list_status       collections_12_mths_ex_med                   acc_now_delinq  
                     -6.185e-01                        2.261e-01                        1.500e+00  
                   tot_coll_amt                      tot_cur_bal                      open_acc_6m  
                      2.307e-05                       -1.057e-06                       -1.049e-01  
                     open_il_6m                      open_il_12m                      open_il_24m  
                     -1.773e-01                        6.202e-01                        8.539e-02  
             mths_since_rcnt_il                     total_bal_il                          il_util  
                     -7.375e-03                        1.206e-06                       -1.392e-04  
                    open_rv_12m                      open_rv_24m                       max_bal_bc  
                      2.434e-01                        4.545e-03                       -4.965e-05  
                       all_util                 total_rev_hi_lim                           inq_fi  
                     -6.684e-03                       -2.158e-05                        4.006e-02  
                    total_cu_tl                     inq_last_12m                annual_inc_merged  
                     -5.500e-02                        6.120e-02                       -7.378e-06  
                     dti_merged            mths_since_delinq_cat       mths_since_last_record_cat  
                      6.407e-02                       -1.807e-01                       -1.394e-01  
mths_since_last_major_derog_cat  
                     -1.629e-01  


[[2]]

Call:
lm(formula = int_rate ~ ., data = train_data_fold)

Coefficients:
                    (Intercept)                        loan_amnt                       emp_length  
                      6.495e+00                        1.238e-04                        2.940e-03  
                 home_ownership              verification_status                          purpose  
                      1.369e-01                        8.660e-01                        3.471e-01  
                     addr_state                      delinq_2yrs                 earliest_cr_line  
                      1.515e-03                        1.398e-02                        2.024e-09  
                 inq_last_6mths                         open_acc                          pub_rec  
                      1.008e+00                        6.684e-02                        3.921e-01  
                      revol_bal                       revol_util                        total_acc  
                      4.134e-06                        4.416e-02                       -3.255e-02  
            initial_list_status       collections_12_mths_ex_med                   acc_now_delinq  
                     -6.204e-01                        3.396e-01                        1.791e+00  
                   tot_coll_amt                      tot_cur_bal                      open_acc_6m  
                      1.774e-05                       -1.541e-06                        1.707e-01  
                     open_il_6m                      open_il_12m                      open_il_24m  
                     -2.146e-01                        6.587e-01                       -1.285e-01  
             mths_since_rcnt_il                     total_bal_il                          il_util  
                     -9.629e-03                        4.188e-06                       -7.130e-03  
                    open_rv_12m                      open_rv_24m                       max_bal_bc  
                      5.293e-02                        1.003e-01                       -1.012e-04  
                       all_util                 total_rev_hi_lim                           inq_fi  
                      6.933e-03                       -2.038e-05                        1.058e-03  
                    total_cu_tl                     inq_last_12m                annual_inc_merged  
                     -7.185e-02                        5.545e-02                       -4.952e-06  
                     dti_merged            mths_since_delinq_cat       mths_since_last_record_cat  
                      7.052e-02                       -2.070e-01                       -1.483e-01  
mths_since_last_major_derog_cat  
                     -1.465e-01  


[[3]]

Call:
lm(formula = int_rate ~ ., data = train_data_fold)

Coefficients:
                    (Intercept)                        loan_amnt                       emp_length  
                      6.795e+00                        1.227e-04                        3.673e-03  
                 home_ownership              verification_status                          purpose  
                      1.796e-01                        8.496e-01                        3.794e-01  
                     addr_state                      delinq_2yrs                 earliest_cr_line  
                      2.056e-03                        4.228e-02                        2.071e-09  
                 inq_last_6mths                         open_acc                          pub_rec  
                      1.040e+00                        4.118e-02                        3.960e-01  
                      revol_bal                       revol_util                        total_acc  
                     -8.947e-06                        5.120e-02                       -2.648e-02  
            initial_list_status       collections_12_mths_ex_med                   acc_now_delinq  
                     -7.368e-01                        4.090e-01                        1.264e+00  
                   tot_coll_amt                      tot_cur_bal                      open_acc_6m  
                      3.001e-05                       -1.351e-06                        3.791e-03  
                     open_il_6m                      open_il_12m                      open_il_24m  
                     -1.259e-01                        7.328e-01                       -1.338e-01  
             mths_since_rcnt_il                     total_bal_il                          il_util  
                     -1.066e-02                        1.841e-06                       -6.795e-03  
                    open_rv_12m                      open_rv_24m                       max_bal_bc  
                      2.146e-01                       -7.199e-03                       -8.579e-05  
                       all_util                 total_rev_hi_lim                           inq_fi  
                      4.057e-03                       -1.006e-06                        5.499e-02  
                    total_cu_tl                     inq_last_12m                annual_inc_merged  
                     -5.518e-02                        6.357e-02                       -9.088e-06  
                     dti_merged            mths_since_delinq_cat       mths_since_last_record_cat  
                      6.126e-02                       -2.122e-01                       -2.423e-01  
mths_since_last_major_derog_cat  
                     -1.384e-01  


[[4]]

Call:
lm(formula = int_rate ~ ., data = train_data_fold)

Coefficients:
                    (Intercept)                        loan_amnt                       emp_length  
                      6.669e+00                        1.203e-04                        8.399e-03  
                 home_ownership              verification_status                          purpose  
                      1.705e-01                        8.574e-01                        3.508e-01  
                     addr_state                      delinq_2yrs                 earliest_cr_line  
                      9.598e-04                        5.734e-02                        2.017e-09  
                 inq_last_6mths                         open_acc                          pub_rec  
                      9.963e-01                        6.263e-02                        3.850e-01  
                      revol_bal                       revol_util                        total_acc  
                      1.191e-05                        4.117e-02                       -3.385e-02  
            initial_list_status       collections_12_mths_ex_med                   acc_now_delinq  
                     -6.315e-01                        2.786e-01                        1.662e+00  
                   tot_coll_amt                      tot_cur_bal                      open_acc_6m  
                      1.838e-05                       -9.500e-07                       -3.635e-02  
                     open_il_6m                      open_il_12m                      open_il_24m  
                     -1.334e-01                        4.343e-01                        1.271e-01  
             mths_since_rcnt_il                     total_bal_il                          il_util  
                     -8.521e-03                        4.237e-06                       -4.376e-03  
                    open_rv_12m                      open_rv_24m                       max_bal_bc  
                      7.466e-02                        1.385e-01                       -6.254e-05  
                       all_util                 total_rev_hi_lim                           inq_fi  
                     -7.971e-03                       -2.401e-05                        1.278e-01  
                    total_cu_tl                     inq_last_12m                annual_inc_merged  
                     -1.062e-01                        5.820e-02                       -4.855e-06  
                     dti_merged            mths_since_delinq_cat       mths_since_last_record_cat  
                      6.929e-02                       -1.944e-01                       -1.617e-01  
mths_since_last_major_derog_cat  
                     -1.483e-01  


[[5]]

Call:
lm(formula = int_rate ~ ., data = train_data_fold)

Coefficients:
                    (Intercept)                        loan_amnt                       emp_length  
                      6.625e+00                        1.279e-04                        1.136e-02  
                 home_ownership              verification_status                          purpose  
                      1.935e-01                        8.283e-01                        3.525e-01  
                     addr_state                      delinq_2yrs                 earliest_cr_line  
                      1.137e-03                       -6.451e-03                        2.030e-09  
                 inq_last_6mths                         open_acc                          pub_rec  
                      1.054e+00                        6.369e-02                        4.255e-01  
                      revol_bal                       revol_util                        total_acc  
                      6.297e-06                        4.456e-02                       -3.225e-02  
            initial_list_status       collections_12_mths_ex_med                   acc_now_delinq  
                     -5.496e-01                        5.413e-01                        1.546e+00  
                   tot_coll_amt                      tot_cur_bal                      open_acc_6m  
                      2.647e-05                       -9.294e-07                        3.598e-02  
                     open_il_6m                      open_il_12m                      open_il_24m  
                     -1.076e-01                        5.165e-01                        5.002e-02  
             mths_since_rcnt_il                     total_bal_il                          il_util  
                     -3.113e-03                        1.363e-06                       -1.340e-03  
                    open_rv_12m                      open_rv_24m                       max_bal_bc  
                      1.594e-01                       -2.279e-02                       -8.140e-05  
                       all_util                 total_rev_hi_lim                           inq_fi  
                     -8.735e-03                       -2.197e-05                        2.062e-02  
                    total_cu_tl                     inq_last_12m                annual_inc_merged  
                     -6.251e-02                        1.092e-01                       -7.380e-06  
                     dti_merged            mths_since_delinq_cat       mths_since_last_record_cat  
                      6.384e-02                       -2.054e-01                       -1.808e-01  
mths_since_last_major_derog_cat  
                     -1.441e-01  


[[6]]

Call:
lm(formula = int_rate ~ ., data = train_data_fold)

Coefficients:
                    (Intercept)                        loan_amnt                       emp_length  
                      6.226e+00                        1.216e-04                        3.531e-04  
                 home_ownership              verification_status                          purpose  
                      1.819e-01                        8.539e-01                        3.753e-01  
                     addr_state                      delinq_2yrs                 earliest_cr_line  
                      2.751e-04                        2.613e-02                        2.194e-09  
                 inq_last_6mths                         open_acc                          pub_rec  
                      1.050e+00                        4.567e-02                        5.423e-01  
                      revol_bal                       revol_util                        total_acc  
                     -8.489e-06                        5.094e-02                       -2.840e-02  
            initial_list_status       collections_12_mths_ex_med                   acc_now_delinq  
                     -7.601e-01                        4.038e-01                        1.302e+00  
                   tot_coll_amt                      tot_cur_bal                      open_acc_6m  
                      2.311e-05                       -1.091e-06                        1.343e-01  
                     open_il_6m                      open_il_12m                      open_il_24m  
                     -1.506e-01                        6.102e-01                        4.087e-02  
             mths_since_rcnt_il                     total_bal_il                          il_util  
                     -7.501e-03                        4.745e-06                       -3.830e-03  
                    open_rv_12m                      open_rv_24m                       max_bal_bc  
                      2.662e-01                       -1.898e-02                       -9.227e-05  
                       all_util                 total_rev_hi_lim                           inq_fi  
                     -4.138e-03                       -1.634e-06                       -5.819e-03  
                    total_cu_tl                     inq_last_12m                annual_inc_merged  
                     -4.751e-02                        5.149e-02                       -1.120e-05  
                     dti_merged            mths_since_delinq_cat       mths_since_last_record_cat  
                      5.727e-02                       -2.382e-01                       -9.641e-02  
mths_since_last_major_derog_cat  
                     -1.312e-01  


[[7]]

Call:
lm(formula = int_rate ~ ., data = train_data_fold)

Coefficients:
                    (Intercept)                        loan_amnt                       emp_length  
                      6.292e+00                        1.187e-04                        2.387e-03  
                 home_ownership              verification_status                          purpose  
                      1.676e-01                        8.765e-01                        3.491e-01  
                     addr_state                      delinq_2yrs                 earliest_cr_line  
                      1.294e-03                        1.753e-02                        2.087e-09  
                 inq_last_6mths                         open_acc                          pub_rec  
                      1.026e+00                        6.105e-02                        4.709e-01  
                      revol_bal                       revol_util                        total_acc  
                      3.357e-06                        4.449e-02                       -3.498e-02  
            initial_list_status       collections_12_mths_ex_med                   acc_now_delinq  
                     -6.449e-01                        2.629e-01                        1.268e+00  
                   tot_coll_amt                      tot_cur_bal                      open_acc_6m  
                      1.447e-05                       -1.594e-06                       -7.157e-02  
                     open_il_6m                      open_il_12m                      open_il_24m  
                     -4.692e-02                        4.124e-01                        8.638e-02  
             mths_since_rcnt_il                     total_bal_il                          il_util  
                     -7.308e-03                        9.496e-07                       -5.300e-03  
                    open_rv_12m                      open_rv_24m                       max_bal_bc  
                      7.600e-02                        1.171e-01                       -7.151e-05  
                       all_util                 total_rev_hi_lim                           inq_fi  
                     -8.874e-03                       -1.923e-05                        1.056e-02  
                    total_cu_tl                     inq_last_12m                annual_inc_merged  
                      1.132e-02                        3.502e-02                       -3.045e-06  
                     dti_merged            mths_since_delinq_cat       mths_since_last_record_cat  
                      7.089e-02                       -2.075e-01                       -1.125e-01  
mths_since_last_major_derog_cat  
                     -1.654e-01  


[[8]]

Call:
lm(formula = int_rate ~ ., data = train_data_fold)

Coefficients:
                    (Intercept)                        loan_amnt                       emp_length  
                      6.209e+00                        1.248e-04                        1.160e-02  
                 home_ownership              verification_status                          purpose  
                      1.773e-01                        8.651e-01                        3.504e-01  
                     addr_state                      delinq_2yrs                 earliest_cr_line  
                      5.853e-04                        3.050e-02                        2.052e-09  
                 inq_last_6mths                         open_acc                          pub_rec  
                      9.914e-01                        6.241e-02                        4.580e-01  
                      revol_bal                       revol_util                        total_acc  
                      5.356e-06                        4.453e-02                       -3.211e-02  
            initial_list_status       collections_12_mths_ex_med                   acc_now_delinq  
                     -6.198e-01                        3.945e-01                        1.584e+00  
                   tot_coll_amt                      tot_cur_bal                      open_acc_6m  
                      4.597e-05                       -1.178e-06                        5.436e-02  
                     open_il_6m                      open_il_12m                      open_il_24m  
                     -2.002e-01                        8.935e-01                       -1.549e-01  
             mths_since_rcnt_il                     total_bal_il                          il_util  
                     -1.179e-02                        2.674e-06                       -3.619e-03  
                    open_rv_12m                      open_rv_24m                       max_bal_bc  
                      1.913e-01                        5.839e-02                       -3.624e-05  
                       all_util                 total_rev_hi_lim                           inq_fi  
                     -5.312e-03                       -2.178e-05                        1.241e-01  
                    total_cu_tl                     inq_last_12m                annual_inc_merged  
                     -5.658e-02                        4.237e-02                       -6.659e-06  
                     dti_merged            mths_since_delinq_cat       mths_since_last_record_cat  
                      6.692e-02                       -1.977e-01                       -1.024e-01  
mths_since_last_major_derog_cat  
                     -1.458e-01  


[[9]]

Call:
lm(formula = int_rate ~ ., data = train_data_fold)

Coefficients:
                    (Intercept)                        loan_amnt                       emp_length  
                      6.183e+00                        1.192e-04                       -3.819e-03  
                 home_ownership              verification_status                          purpose  
                      1.472e-01                        8.480e-01                        3.663e-01  
                     addr_state                      delinq_2yrs                 earliest_cr_line  
                      3.031e-03                       -1.195e-02                        2.066e-09  
                 inq_last_6mths                         open_acc                          pub_rec  
                      9.837e-01                        5.603e-02                        4.285e-01  
                      revol_bal                       revol_util                        total_acc  
                      5.150e-06                        4.455e-02                       -2.954e-02  
            initial_list_status       collections_12_mths_ex_med                   acc_now_delinq  
                     -6.202e-01                        1.077e-01                        7.956e-01  
                   tot_coll_amt                      tot_cur_bal                      open_acc_6m  
                      3.526e-05                       -1.392e-06                        2.585e-02  
                     open_il_6m                      open_il_12m                      open_il_24m  
                     -1.490e-01                        6.185e-01                        2.844e-02  
             mths_since_rcnt_il                     total_bal_il                          il_util  
                     -4.387e-03                        4.846e-07                       -8.214e-04  
                    open_rv_12m                      open_rv_24m                       max_bal_bc  
                      4.166e-02                        1.129e-01                       -8.249e-05  
                       all_util                 total_rev_hi_lim                           inq_fi  
                     -5.746e-03                       -2.086e-05                       -2.847e-02  
                    total_cu_tl                     inq_last_12m                annual_inc_merged  
                     -8.818e-02                        7.265e-02                       -4.097e-06  
                     dti_merged            mths_since_delinq_cat       mths_since_last_record_cat  
                      6.711e-02                       -2.058e-01                       -1.159e-01  
mths_since_last_major_derog_cat  
                     -1.271e-01  


[[10]]

Call:
lm(formula = int_rate ~ ., data = train_data_fold)

Coefficients:
                    (Intercept)                        loan_amnt                       emp_length  
                      6.620e+00                        1.237e-04                        3.628e-03  
                 home_ownership              verification_status                          purpose  
                      1.518e-01                        8.846e-01                        3.535e-01  
                     addr_state                      delinq_2yrs                 earliest_cr_line  
                      2.738e-04                        5.111e-02                        2.013e-09  
                 inq_last_6mths                         open_acc                          pub_rec  
                      1.007e+00                        6.695e-02                        3.318e-01  
                      revol_bal                       revol_util                        total_acc  
                      5.070e-06                        4.422e-02                       -3.177e-02  
            initial_list_status       collections_12_mths_ex_med                   acc_now_delinq  
                     -6.139e-01                        1.075e-01                        1.207e+00  
                   tot_coll_amt                      tot_cur_bal                      open_acc_6m  
                      2.896e-05                       -1.315e-06                        5.319e-02  
                     open_il_6m                      open_il_12m                      open_il_24m  
                     -1.678e-01                        4.041e-01                        9.409e-02  
             mths_since_rcnt_il                     total_bal_il                          il_util  
                     -1.282e-02                        1.377e-06                        1.857e-04  
                    open_rv_12m                      open_rv_24m                       max_bal_bc  
                      3.216e-01                       -1.583e-02                       -9.745e-05  
                       all_util                 total_rev_hi_lim                           inq_fi  
                     -2.326e-03                       -2.255e-05                        4.121e-02  
                    total_cu_tl                     inq_last_12m                annual_inc_merged  
                     -1.113e-01                        7.710e-02                       -5.135e-06  
                     dti_merged            mths_since_delinq_cat       mths_since_last_record_cat  
                      6.467e-02                       -1.850e-01                       -2.054e-01  
mths_since_last_major_derog_cat  
                     -1.184e-01  
# Print the per-fold metrics table accumulated in `results`
print(results)


#### Decision Trees ####

# tree() fails on this data with the error "factor predictors must have at most 32 levels".
# The limit exists because a factor with k levels can be divided into two groups in about 2^(k-1) ways, so searching for the best split becomes prohibitively expensive for factors with many levels (already about 2^31 candidate splits at 32 levels).


# Fit a decision tree model on the training data
#tm <- tree(int_rate ~ ., data = sampled_train_data)

# Make predictions on the training and testing data
#tm.train_predictions <- predict(tm, newdata = sampled_train_data)
#tm.test_predictions <- predict(tm, newdata = sampled_test_data)

# Calculate Mean Squared Error (MSE) for training and testing
#tm.train_mse <- mean((tm.train_predictions - sampled_train_data$int_rate)^2)
#tm.test_mse <- mean((tm.test_predictions - sampled_test_data$int_rate)^2)

# Calculate Root Mean Squared Error (RMSE) for training and testing
#tm.train_rmse <- sqrt(tm.train_mse)
#tm.test_rmse <- sqrt(tm.test_mse)

# Calculate Mean Absolute Error (MAE) for training and testing
#tm.train_mae <- mean(abs(tm.train_predictions - sampled_train_data$int_rate))
#tm.test_mae <- mean(abs(tm.test_predictions - sampled_test_data$int_rate))

# Calculate R-squared (R²) for training and testing
#tm.train_r2 <- 1 - (sum((sampled_train_data$int_rate - tm.train_predictions)^2) / sum((sampled_train_data$int_rate - mean(sampled_train_data$int_rate))^2))
#tm.test_r2 <- 1 - (sum((sampled_test_data$int_rate - tm.test_predictions)^2) / sum((sampled_test_data$int_rate - mean(sampled_test_data$int_rate))^2))

# Display the metrics
#cat("Training MSE:", tm.train_mse, "\n")
#cat("Testing MSE:", tm.test_mse, "\n")
#cat("Training RMSE:", tm.train_rmse, "\n")
#cat("Testing RMSE:", tm.test_rmse, "\n")
#cat("Training MAE:", tm.train_mae, "\n")
#cat("Testing MAE:", tm.test_mae, "\n")
#cat("Training R-squared (R²):", tm.train_r2, "\n")
#cat("Testing R-squared (R²):", tm.test_r2, "\n")

#### Random Forest ####

# Train a Random Forest model
rf <- ranger(formula = int_rate ~ ., data = sampled_train_data, num.trees = 500, verbose=TRUE, importance = "impurity", oob.error = TRUE)
Growing trees.. Progress: 11%. Estimated remaining time: 4 minutes, 0 seconds.
Growing trees.. Progress: 24%. Estimated remaining time: 3 minutes, 17 seconds.
Growing trees.. Progress: 37%. Estimated remaining time: 2 minutes, 41 seconds.
Growing trees.. Progress: 50%. Estimated remaining time: 2 minutes, 7 seconds.
Growing trees.. Progress: 63%. Estimated remaining time: 1 minute, 33 seconds.
Growing trees.. Progress: 75%. Estimated remaining time: 1 minute, 2 seconds.
Growing trees.. Progress: 87%. Estimated remaining time: 33 seconds.
Growing trees.. Progress: 99%. Estimated remaining time: 1 seconds.
# Print the model summary
print("Random Forest Model Summary:")
[1] "Random Forest Model Summary:"
print(rf)
Ranger result

Call:
 ranger(formula = int_rate ~ ., data = sampled_train_data, num.trees = 500,      verbose = TRUE, importance = "impurity", oob.error = TRUE) 

Type:                             Regression 
Number of trees:                  500 
Sample size:                      638392 
Number of independent variables:  39 
Mtry:                             6 
Target node size:                 5 
Variable importance mode:         impurity 
Splitrule:                        variance 
OOB prediction error (MSE):       11.08217 
R squared (OOB):                  0.4229489 
# Make predictions on the training and testing data
rf.train_predictions <- predict(rf, data = sampled_train_data)
Predicting.. Progress: 73%. Estimated remaining time: 11 seconds.
rf.test_predictions <- predict(rf, data = sampled_test_data)

# Error metrics for the Random Forest, grouped by data split.
# `with()` evaluates each expression inside the corresponding data frame so
# that `int_rate` refers to the observed target of that split; the ranger
# prediction objects are looked up in the calling environment.

# --- Training split: MSE, RMSE, MAE, R-squared ---
rf.train_mse <- with(
  sampled_train_data,
  mean((rf.train_predictions$predictions - int_rate)^2)
)
rf.train_rmse <- sqrt(rf.train_mse)
rf.train_mae <- with(
  sampled_train_data,
  mean(abs(rf.train_predictions$predictions - int_rate))
)
# R-squared = 1 - (residual sum of squares / total sum of squares)
rf.train_r2 <- with(
  sampled_train_data,
  1 - (sum((int_rate - rf.train_predictions$predictions)^2) /
    sum((int_rate - mean(int_rate))^2))
)

# --- Testing split: MSE, RMSE, MAE, R-squared ---
rf.test_mse <- with(
  sampled_test_data,
  mean((rf.test_predictions$predictions - int_rate)^2)
)
rf.test_rmse <- sqrt(rf.test_mse)
rf.test_mae <- with(
  sampled_test_data,
  mean(abs(rf.test_predictions$predictions - int_rate))
)
rf.test_r2 <- with(
  sampled_test_data,
  1 - (sum((int_rate - rf.test_predictions$predictions)^2) /
    sum((int_rate - mean(int_rate))^2))
)

# Display the metrics
cat("Training MSE:", rf.train_mse, "\n")
Training MSE: 2.572857 
cat("Testing MSE:", rf.test_mse, "\n")
Testing MSE: 11.01728 
cat("Training RMSE:", rf.train_rmse, "\n")
Training RMSE: 1.604013 
cat("Testing RMSE:", rf.test_rmse, "\n")
Testing RMSE: 3.319228 
cat("Training MAE:", rf.train_mae, "\n")
Training MAE: 1.260271 
cat("Testing MAE:", rf.test_mae, "\n")
Testing MAE: 2.6258 
cat("Training R-squared (R²):", rf.train_r2, "\n")
Training R-squared (R²): 0.8660306 
cat("Testing R-squared (R²):", rf.test_r2, "\n")
Testing R-squared (R²): 0.4260632 
#rf <- randomForest(int_rate~., data=train_data, ntree = 5, mtry = 3)
#bag.boston=randomForest(medv~.,data=Boston,subset=train, mtry=13,importance =TRUE)
#print(rf)

# Set the number of cores you want to use
#num_cores <- 6  # Adjust this number based on your system's capabilities

# Register parallel backend
#cl <- makeCluster(num_cores)
#registerDoParallel(cl)

# Assuming 'lc_data' is your dataset
#rf_model <- foreach(ntree = rep(100, num_cores), .packages = 'randomForest') %dopar% {
#    randomForest(int_rate ~ ., data = lc_data, ntree = ntree, mtry = sqrt(ncol(lc_data)))
#}

# After training, stop the cluster to release the cores:
#stopCluster(cl)

#### Boosting ####

# Define the target variable for training and testing
xgb.y_train <- sampled_train_data$int_rate
xgb.y_test <- sampled_test_data$int_rate  # Use sampled_test_data for testing

# Define the feature frames for training and testing (every column except the
# target). A logical name mask is used instead of `-which(...)`: when the name
# is absent, `-which()` evaluates to `-integer(0)`, which selects ZERO columns
# rather than all of them. `drop = FALSE` keeps a data frame even if only a
# single predictor column remains.
xgb.X_train <- sampled_train_data[, names(sampled_train_data) != "int_rate", drop = FALSE]
xgb.X_test <- sampled_test_data[, names(sampled_test_data) != "int_rate", drop = FALSE]

# xgboost() is given numeric matrices; convert each split once and reuse the
# result for both fitting and prediction.
xgb.train_matrix <- as.matrix(xgb.X_train)
xgb.test_matrix <- as.matrix(xgb.X_test)

# Fit a gradient boosting regression model using xgboost
xgb <- xgboost(
  data = xgb.train_matrix,
  label = xgb.y_train,
  nrounds = 100,
  verbose = 0
)

# Make predictions on the training and testing data
xgb.train_predictions <- predict(xgb, newdata = xgb.train_matrix)
xgb.test_predictions <- predict(xgb, newdata = xgb.test_matrix)

# Calculate Mean Squared Error (MSE) for training and testing
xgb.train_mse <- mean((xgb.train_predictions - xgb.y_train)^2)
xgb.test_mse <- mean((xgb.test_predictions - xgb.y_test)^2)

# Calculate Root Mean Squared Error (RMSE) for training and testing
xgb.train_rmse <- sqrt(xgb.train_mse)
xgb.test_rmse <- sqrt(xgb.test_mse)

# Calculate Mean Absolute Error (MAE) for training and testing
xgb.train_mae <- mean(abs(xgb.train_predictions - xgb.y_train))
xgb.test_mae <- mean(abs(xgb.test_predictions - xgb.y_test))

# Calculate R-squared (R²) for training and testing:
# 1 - (residual sum of squares / total sum of squares)
xgb.train_r2 <- 1 - (sum((xgb.y_train - xgb.train_predictions)^2) / sum((xgb.y_train - mean(xgb.y_train))^2))
xgb.test_r2 <- 1 - (sum((xgb.y_test - xgb.test_predictions)^2) / sum((xgb.y_test - mean(xgb.y_test))^2))

# Display the metrics
cat("Training MSE:", xgb.train_mse, "\n")
Training MSE: 9.918589 
cat("Testing MSE:", xgb.test_mse, "\n")
Testing MSE: 10.29675 
cat("Training RMSE:", xgb.train_rmse, "\n")
Training RMSE: 3.149379 
cat("Testing RMSE:", xgb.test_rmse, "\n")
Testing RMSE: 3.208854 
cat("Training MAE:", xgb.train_mae, "\n")
Training MAE: 2.475425 
cat("Testing MAE:", xgb.test_mae, "\n")
Testing MAE: 2.522647 
cat("Training R-squared (R²):", xgb.train_r2, "\n")
Training R-squared (R²): 0.4835362 
cat("Testing R-squared (R²):", xgb.test_r2, "\n")
Testing R-squared (R²): 0.4635987 

Below, a scatter plot of actual vs. predicted training values is drawn for each model. These plots help us visualize how well each model’s predictions align with the actual data points.

# Actual-vs-predicted scatter plot for the training split.
#
# Arguments:
#   actual_values    observed target values
#   predicted_values model predictions, same length as `actual_values`
#   model_name       string used as the plot title
# Returns a ggplot object (nothing is drawn until it is printed).
# Note: `ylim(-50, 50)` sets scale limits, so points whose prediction lies
# outside that range are not drawn.
create_scatter_plot <- function(actual_values, predicted_values, model_name) {
  pairs_df <- data.frame(Actual = actual_values, Predicted = predicted_values)

  # Dashed red y = x line: a perfect model would put every point on it
  identity_line <- geom_abline(
    intercept = 0, slope = 1,
    linetype = "dashed", color = "red"
  )
  axis_labels <- labs(
    x = "Actual Training Values",
    y = "Predicted Training Values",
    title = model_name
  )

  ggplot(pairs_df, aes(x = Actual, y = Predicted)) +
    geom_point() +
    identity_line +
    axis_labels +
    theme_minimal() +
    ylim(-50, 50)
}

# One training-set scatter plot per model
lm_scatter_plot <- create_scatter_plot(
  sampled_train_data$int_rate, lm.train_predictions, "Linear Regression"
)
rf_scatter_plot <- create_scatter_plot(
  sampled_train_data$int_rate, rf.train_predictions$predictions, "Random Forest"
)
xgb_scatter_plot <- create_scatter_plot(
  xgb.y_train, xgb.train_predictions, "XGBoost"
)

# Render each plot on its own
print(lm_scatter_plot)

print(rf_scatter_plot)

print(xgb_scatter_plot)

Below, a scatter plot of actual vs. predicted testing values is drawn for each model. These plots help us visualize how well each model’s predictions align with the actual data points.

# Actual-vs-predicted scatter plot for the testing split. This redefines
# create_scatter_plot() with testing-specific axis labels.
#
# Arguments:
#   actual_values    observed target values
#   predicted_values model predictions, same length as `actual_values`
#   model_name       string used as the plot title
# Returns a ggplot object (nothing is drawn until it is printed).
# Note: `ylim(-50, 50)` sets scale limits, so points whose prediction lies
# outside that range are not drawn.
create_scatter_plot <- function(actual_values, predicted_values, model_name) {
  pairs_df <- data.frame(Actual = actual_values, Predicted = predicted_values)

  # Dashed red y = x line: a perfect model would put every point on it
  identity_line <- geom_abline(
    intercept = 0, slope = 1,
    linetype = "dashed", color = "red"
  )
  axis_labels <- labs(
    x = "Actual Testing Values",
    y = "Predicted Testing Values",
    title = model_name
  )

  ggplot(pairs_df, aes(x = Actual, y = Predicted)) +
    geom_point() +
    identity_line +
    axis_labels +
    theme_minimal() +
    ylim(-50, 50)
}

# One testing-set scatter plot per model
lm_scatter_plot <- create_scatter_plot(
  sampled_test_data$int_rate, lm.test_predictions, "Linear Regression"
)
rf_scatter_plot <- create_scatter_plot(
  sampled_test_data$int_rate, rf.test_predictions$predictions, "Random Forest"
)
xgb_scatter_plot <- create_scatter_plot(
  xgb.y_test, xgb.test_predictions, "XGBoost"
)

# Render each plot on its own
print(lm_scatter_plot)

print(rf_scatter_plot)

print(xgb_scatter_plot)

Residual plots can help identify patterns in prediction errors and assess whether the assumptions of linear regression (if applicable) are met.

# Residuals-vs-predicted plot.
#
# Arguments:
#   actual_values    observed target values
#   predicted_values model predictions, same length as `actual_values`
#   model_name       string appended to the plot title
# Returns a ggplot object. Residuals are computed as actual - predicted.
# Note: the x/y limits are scale limits, so points with a prediction outside
# [0, 40] or a residual outside [-30, 30] are not drawn.
create_residual_plot <- function(actual_values, predicted_values, model_name) {
  residual_data <- data.frame(
    Predicted = predicted_values,
    Residuals = actual_values - predicted_values
  )
  plot_title <- paste("Residual Plot -", model_name)

  # Dashed red zero line: residuals of an unbiased model scatter around it
  zero_line <- geom_hline(yintercept = 0, linetype = "dashed", color = "red")

  ggplot(residual_data, aes(x = Predicted, y = Residuals)) +
    geom_point() +
    zero_line +
    labs(x = "Predicted Values", y = "Residuals", title = plot_title) +
    theme_minimal() +
    ylim(-30, 30) +
    xlim(0, 40)
}

# One training-set residual plot per model
lm_residual_plot <- create_residual_plot(
  sampled_train_data$int_rate, lm.train_predictions, "Linear Regression"
)
rf_residual_plot <- create_residual_plot(
  sampled_train_data$int_rate, rf.train_predictions$predictions, "Random Forest"
)
xgb_residual_plot <- create_residual_plot(
  xgb.y_train, xgb.train_predictions, "XGBoost"
)

# Render each plot on its own
print(lm_residual_plot)

print(rf_residual_plot)

print(xgb_residual_plot)

From the plots above we can clearly see that:

This visualization can help you compare the distribution of prediction errors across models.

# Kernel-density plot of the residuals (actual - predicted).
#
# Arguments:
#   actual_values    observed target values
#   predicted_values model predictions, same length as `actual_values`
#   model_name       string appended to the plot title
# Returns a ggplot object.
create_residual_density_plot <- function(actual_values, predicted_values, model_name) {
  residual_data <- data.frame(Residuals = actual_values - predicted_values)
  plot_title <- paste("Residual Density Plot -", model_name)

  ggplot(residual_data, aes(x = Residuals)) +
    geom_density(fill = "skyblue", color = "black", alpha = 0.7) +
    labs(x = "Residuals", y = "Density", title = plot_title) +
    theme_minimal()
}

# One training-set residual density plot per model
lm_residual_density_plot <- create_residual_density_plot(
  sampled_train_data$int_rate, lm.train_predictions, "Linear Regression"
)
rf_residual_density_plot <- create_residual_density_plot(
  sampled_train_data$int_rate, rf.train_predictions$predictions, "Random Forest"
)
xgb_residual_density_plot <- create_residual_density_plot(
  xgb.y_train, xgb.train_predictions, "XGBoost"
)

# Render each plot on its own
print(lm_residual_density_plot)

print(rf_residual_density_plot)

print(xgb_residual_density_plot)

This visualization can help you compare the distribution of prediction errors across models through histograms.

# Histogram of the residuals (actual - predicted) on a density scale, with a
# red kernel-density curve drawn on top.
#
# Arguments:
#   actual_values    observed target values
#   predicted_values model predictions, same length as `actual_values`
#   model_name       string appended to the plot title
# Returns a ggplot object.
# Note: `xlim()`/`ylim()` are scale limits, so residuals outside [-20, 20]
# are discarded before binning and anything above a density of 0.3 is not
# drawn.
create_residual_histogram_plot <- function(actual_values, predicted_values, model_name) {
  residual_data <- data.frame(Residuals = actual_values - predicted_values)
  plot_title <- paste("Residual Histogram Plot with Density Curve -", model_name)

  # Bars use density (not counts) on the y-axis so they share a scale with
  # the overlaid density curve
  bars <- geom_histogram(
    aes(y = after_stat(density)),
    bins = 30, fill = "skyblue", color = "black", alpha = 0.7
  )
  curve_layer <- geom_density(color = "red", linewidth = 1.5)

  ggplot(residual_data, aes(x = Residuals)) +
    bars +
    curve_layer +
    labs(x = "Residuals", y = "Density", title = plot_title) +
    theme_minimal() +
    xlim(-20,20) +
    ylim(0, 0.3)
}

# One training-set residual histogram per model
lm_residual_histogram_plot <- create_residual_histogram_plot(
  sampled_train_data$int_rate, lm.train_predictions, "Linear Regression"
)
rf_residual_histogram_plot <- create_residual_histogram_plot(
  sampled_train_data$int_rate, rf.train_predictions$predictions, "Random Forest"
)
xgb_residual_histogram_plot <- create_residual_histogram_plot(
  xgb.y_train, xgb.train_predictions, "XGBoost"
)

# Render each plot on its own
print(lm_residual_histogram_plot)

print(rf_residual_histogram_plot)

print(xgb_residual_histogram_plot)

A bar chart comparing the training R-squared (coefficient of determination) values of the models is created. R-squared measures the proportion of variance in the target variable explained by the model. Higher R-squared values indicate better model fit.

# Training R-squared of each model, in the same order as `model_names`
model_names <- c("Linear Regression", "Random Forest", "XGBoost")
r_squared_values <- c(lm.train_r2, rf.train_r2, xgb.train_r2)

# One row per model; Model is a factor so ggplot treats it as discrete
r_squared_data <- data.frame(
  Model = factor(model_names),
  R_squared = r_squared_values
)

# Bar chart: one bar per model, bar height = R-squared, x labels tilted 45°
r_squared_bar_chart <-
  ggplot(r_squared_data, aes(x = Model, y = R_squared, fill = Model)) +
  geom_bar(stat = "identity") +
  labs(
    x = "Model",
    y = "R-squared (R²)",
    title = "R-squared Comparison"
  ) +
  theme_minimal() +
  theme(axis.text.x = element_text(angle = 45, hjust = 1))

# Render the chart
print(r_squared_bar_chart)

Bar charts comparing the MAE and RMSE values of the models are generated, one for the training set and one for the testing set. These metrics quantify the average prediction errors of each model, and lower values are preferred.

# Long-format layout: the three models appear twice, first for the MAE rows
# and then for the RMSE rows.
model_names <- rep(c("Linear Regression", "Random Forest", "XGBoost"), times = 2)
error_type <- rep(c("MAE", "RMSE"), each = 3)

# Error values in the same row order as `model_names` / `error_type`
error_values_train <- c(
  lm.train_mae, rf.train_mae, xgb.train_mae,
  lm.train_rmse, rf.train_rmse, xgb.train_rmse
)
error_values_test <- c(
  lm.test_mae, rf.test_mae, xgb.test_mae,
  lm.test_rmse, rf.test_rmse, xgb.test_rmse
)

# Explicit factor levels fix the left-to-right order of the models on the axis
model_errors_train <- data.frame(
  Model = factor(model_names, levels = unique(model_names)),
  Error = error_values_train,
  Type = error_type
)
model_errors_test <- data.frame(
  Model = factor(model_names, levels = unique(model_names)),
  Error = error_values_test,
  Type = error_type
)

# Grouped bars (MAE next to RMSE) per model. `ylim(0, 4)` is a scale limit,
# so a bar taller than 4 would not be drawn.
error_bar_chart_train <-
  ggplot(model_errors_train, aes(x = Model, y = Error, fill = Type)) +
  geom_bar(stat = "identity", position = "dodge") +
  labs(
    x = "Model",
    y = "Error Value",
    title = "Training MAE and RMSE Comparison"
  ) +
  theme_minimal() +
  theme(axis.text.x = element_text(angle = 45, hjust = 1)) +
  ylim(0, 4)

error_bar_chart_test <-
  ggplot(model_errors_test, aes(x = Model, y = Error, fill = Type)) +
  geom_bar(stat = "identity", position = "dodge") +
  labs(
    x = "Model",
    y = "Error Value",
    title = "Testing MAE and RMSE Comparison"
  ) +
  theme_minimal() +
  theme(axis.text.x = element_text(angle = 45, hjust = 1)) +
  ylim(0, 4)

# Render the training chart, then the testing chart
print(error_bar_chart_train)

print(error_bar_chart_test)

#### Random Forest Feature Importance Plot ####
# Build a variable-importance plot for the fitted ranger model `rf`, limited
# to the 20 highest-ranked features, then draw it.
v1 <- vip(rf, num_features = 20, title = "Ranger")
plot(v1)

Learning curve using RMSE and R^2:

# TODO: change the x-axes
# Create data frames with RMSE and R-squared values for each model and sample size
model_names <- c("Linear Regression", "Random Forest", "XGBoost")
sample_sizes <- seq(10, nrow(sampled_train_data), by = 10)  # Adjust the sample sizes as needed

# NOTE: each model contributes a single metric value computed on the full
# training set, repeated for every sample size, so every "curve" is a flat
# line. A genuine learning curve would require refitting each model on
# subsets of increasing size.
#
# The metric vectors are expanded with `each =` so that they line up with
# `Model` (which is also built with `each =`). Relying on data.frame()
# recycling would cycle the three values row by row (lm, rf, xgb, lm, ...)
# and pair them with the wrong model.
rmse_data <- data.frame(
  Model = rep(model_names, each = length(sample_sizes)),
  Sample_Size = rep(sample_sizes, times = length(model_names)),
  RMSE = rep(
    c(lm.train_rmse, rf.train_rmse, xgb.train_rmse),
    each = length(sample_sizes)
  )
)

r_squared_data <- data.frame(
  Model = rep(model_names, each = length(sample_sizes)),
  Sample_Size = rep(sample_sizes, times = length(model_names)),
  R_squared = rep(
    c(lm.train_r2, rf.train_r2, xgb.train_r2),
    each = length(sample_sizes)
  )
)

# Line chart of RMSE against sample size, one coloured line per model
rmse_curve <-
  ggplot(rmse_data, aes(x = Sample_Size, y = RMSE, color = Model)) +
  geom_line() +
  labs(
    x = "Sample Size",
    y = "RMSE",
    title = "RMSE Learning Curve"
  ) +
  theme_minimal()

# Line chart of R-squared against sample size, one coloured line per model
r_squared_curve <-
  ggplot(r_squared_data, aes(x = Sample_Size, y = R_squared, color = Model)) +
  geom_line() +
  labs(
    x = "Sample Size",
    y = "R-squared",
    title = "R-squared Learning Curve"
  ) +
  theme_minimal()

# Render the RMSE curve, then the R-squared curve
print(rmse_curve)

print(r_squared_curve)

Add a new chunk by clicking the Insert Chunk button on the toolbar or by pressing Ctrl+Alt+I.

When you save the notebook, an HTML file containing the code and output will be saved alongside it (click the Preview button or press Ctrl+Shift+K to preview the HTML file).

The preview shows you a rendered HTML copy of the contents of the editor. Consequently, unlike Knit, Preview does not run any R code chunks. Instead, the output of the chunk when it was last run in the editor is displayed.

LS0tCnRpdGxlOiAiUiBOb3RlYm9vayIKb3V0cHV0OiBodG1sX25vdGVib29rCi0tLQoKIyBEYXRhIFByZS1wcm9jZXNzaW5nCgpMb2FkIG5lZWRlZCBsaWJyYXJpZXMKCmBgYHtyfQpsaWJyYXJ5KGZhc3REdW1taWVzKQpsaWJyYXJ5KHJlYWRyKQpsaWJyYXJ5KGdncGxvdDIpCmxpYnJhcnkoZHBseXIpCmxpYnJhcnkoY2FyZXQpCmxpYnJhcnkoZ2xtbmV0KQpsaWJyYXJ5KGJvb3QpCmxpYnJhcnkodHJlZSkKbGlicmFyeShyYW5nZXIpCmxpYnJhcnkoeGdib29zdCkKbGlicmFyeShnYm0pCmxpYnJhcnkodmlwKQpsaWJyYXJ5KElTTFIpCmBgYAoKU2V0IHRoZSBzZWVkIGZvciByZXByb2R1Y2liaWxpdHkKCmBgYHtyfQpzZXQuc2VlZCgxKQpgYGAKCkxvYWQgdGhlIGRhdGFzZXQKCmBgYHtyfQpvcmlnaW5hbF9sY19kYXRhIDwtIHJlYWQuY3N2KCJMQ2RhdGEuY3N2IixzZXAgPSAiOyIpCmxjX2RhdGEgPC0gb3JpZ2luYWxfbGNfZGF0YQpgYGAKCnJlbW92ZSBhdHRyaWJ1dGVzIG5vdCBhdmFpbGFibGUgZm9yIHByZWRpY3Rpb24KCmBgYHtyfQpsY19kYXRhIDwtIHN1YnNldChsY19kYXRhLCBzZWxlY3QgPSAtYyhjb2xsZWN0aW9uX3JlY292ZXJ5X2ZlZSwgaW5zdGFsbG1lbnQsIGlzc3VlX2QsCiAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgIGxhc3RfcHltbnRfYW1udCwgbGFzdF9weW1udF9kLCBsb2FuX3N0YXR1cywKICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgbmV4dF9weW1udF9kLCBvdXRfcHJuY3AsIG91dF9wcm5jcF9pbnYsCiAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgIHB5bW50X3BsYW4sIHJlY292ZXJpZXMsCiAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgIHRlcm0sIHRvdGFsX3B5bW50LAogICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICB0b3RhbF9weW1udF9pbnYsdG90YWxfcmVjX2ludCwgdG90YWxfcmVjX2xhdGVfZmVlLCAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgdG90YWxfcmVjX3BybmNwKSkKCmBgYAoKYGBge3J9CnN1bW1hcnkobGNfZGF0YSkKYGBgCgpGaXJzdCB3ZSBkZWxldGUgdGhlIGNvbHVtbnMgd2hpY2ggYXJlbid0IHVzZWZ1bCBmb3Igb3VyIHByZWRpY3Rpb24KCmBgYHtyfQpsY19kYXRhJGlkIDwtIE5VTEwKbGNfZGF0YSRtZW1iZXJfaWQgPC0gTlVMTApsY19kYXRhJHppcF9jb2RlIDwtIE5VTEwKbGNfZGF0YSR1cmwgPC0gTlVMTApgYGAKTG9va3MgbGlrZSAqKnBvbGljeV9jb2RlKiogY29udGFpbnMganVzdCB2YWx1ZSBlcXVhbCB0byAxLCBpdCBjYW4gYmUgcmVtb3ZlZApgYGB7cn0KbGNfZGF0YSRwb2xpY3lfY29kZSA8LSBOVUxMCmBgYApSZW1vdmUgYWRkaXRpb25hbCBjb2x1bW5zIHdoaWNoIGFyZSByZWxhdGVkIHRvIHRoZSBoaXN0b3JpY2FsIGRhdGEKYGBge3J9CmxjX2RhdGEkbGFzdF9jcmVkaXRfcHVsbF9kIDwtIE5VTEwKYGBgCgpUaGVuIHdl
IGRlbGV0ZSB0aGUgY29sdW1ucyB3aGljaCBjYW4ndCBiZSBjb252ZXJ0ZWQgdG8gY2F0ZWdvcmljYWwgYW5kIHJlcXVpcmUgTkxQCgpgYGB7cn0KbGNfZGF0YSR0aXRsZSA8LSBOVUxMCmxjX2RhdGEkZGVzYyA8LSBOVUxMCmxjX2RhdGEkZW1wX3RpdGxlIDwtIE5VTEwKCmBgYAoKbGV0J3MgZXhhbWluZSB0aGUgKipsb2FuX2FtbnQqKiBjb2x1bW4KCmBgYHtyfQpzdW0oaXMubmEobGNfZGF0YSRsb2FuX2FtbnQpKQpjb3IobGNfZGF0YSRsb2FuX2FtbnQsIGxjX2RhdGEkaW50X3JhdGUpCmhpc3QobGNfZGF0YSRsb2FuX2FtbnQsIGJyZWFrcyA9IDIwLCBtYWluID0gImxvYW5fYW1udCBkaXN0cmlidXRpb24iLCB4bGFiID0gImxvYW5fYW1udCIsIGNvbCA9ICJsaWdodGJsdWUiLCBib3JkZXIgPSAiYmxhY2siKQpnZ3Bsb3QoZGF0YSA9IGxjX2RhdGEsIG1hcHBpbmcgPSBhZXMoeD1pbnRfcmF0ZSx5PWxvYW5fYW1udCkpICsgZ2VvbV9ib3hwbG90KCkKYGBgCgpzdGFuZGFyZGl6ZSAqKmxvYW5fYW1udCoqCgpgYGB7cn0KI2xjX2RhdGEkbG9hbl9hbW50IDwtIHNjYWxlKGxjX2RhdGEkbG9hbl9hbW50KQpgYGAKCmxldCdzIGV4YW1pbmUgdGhlICoqZnVuZGVkX2FtbnQqKiBjb2x1bW4KCmBgYHtyfQpzdW0oaXMubmEobGNfZGF0YSRmdW5kZWRfYW1udCkpCmNvcihsY19kYXRhJGZ1bmRlZF9hbW50LCBsY19kYXRhJGludF9yYXRlKQpoaXN0KGxjX2RhdGEkZnVuZGVkX2FtbnQsIGJyZWFrcyA9IDIwLCBtYWluID0gImZ1bmRlZF9hbW50IGRpc3RyaWJ1dGlvbiIsIHhsYWIgPSAiZnVuZGVkX2FtbnQiLCBjb2wgPSAibGlnaHRibHVlIiwgYm9yZGVyID0gImJsYWNrIikKYGBgCgphcyB3ZSBjYW4gc2VlLCAqKmZ1bmRlZF9hbW50KiogaXMgYWxtb3N0IHRoZSBzYW1lIGFzIHRoZSAqKmxvYW5fYW1udCoqIGNvbHVtbiwgY29uc2VxdWVudGx5LCB3ZSByZW1vdmUgaXQuCgpgYGB7cn0KbGNfZGF0YSRmdW5kZWRfYW1udCA8LSBOVUxMIApgYGAKCmxldCdzIGV4YW1pbmUgdGhlICoqZnVuZGVkX2FtbnRfaW52KiogY29sdW1uCgpgYGB7cn0Kc3VtKGlzLm5hKGxjX2RhdGEkZnVuZGVkX2FtbnRfaW52KSkKY29yKGxjX2RhdGEkZnVuZGVkX2FtbnRfaW52LCBsY19kYXRhJGludF9yYXRlKQpoaXN0KGxjX2RhdGEkZnVuZGVkX2FtbnRfaW52LCBicmVha3MgPSAyMCwgbWFpbiA9ICJmdW5kZWRfYW1udF9pbnYgZGlzdHJpYnV0aW9uIiwgeGxhYiA9ICJmdW5kZWRfYW1udF9pbnYiLCBjb2wgPSAibGlnaHRibHVlIiwgYm9yZGVyID0gImJsYWNrIikKYGBgCgpyZW1vdmUgKipmdW5kZWRfYW1udF9pbnYqKiBmb3IgdGhlIHNhbWUgcmVhc29uIGFzIGFib3ZlCgpgYGB7cn0KbGNfZGF0YSRmdW5kZWRfYW1udF9pbnYgPC0gTlVMTApgYGAKCmxldCdzIHNlZSB0aGUgKippbnRfcmF0ZSoqIGRpc3RyaWJ1dGlvbi4KYGBge3J9Cmhpc3QobGNfZGF0YSRpbnRfcmF0ZSwgYnJlYWtzID0gMjAsIG1haW4gPSAiaW50X3JhdGUgZGlzdHJpYnV0aW9uIiwgeGxhYiA9ICJpbnRf
cmF0ZSIsIGNvbCA9ICJsaWdodGJsdWUiLCBib3JkZXIgPSAiYmxhY2siKQpgYGAKU3RhbmRhcmRpemUgaW50IHJhdGU6CmBgYHtyfQojbGNfZGF0YSRpbnRfcmF0ZSA8LSBzY2FsZShsY19kYXRhJGludF9yYXRlKQpgYGAKd2UgZGVsZXRlIHRoZSAqKmVtcF90aXRsZSoqIGNvbHVtbiBhcyB0aGVyZSBhcmUgc2V2ZXJhbCBlbnRyaWVzIGZvciB0aGUgc2FtZSBqb2IgdGl0bGUgYW5kIGJlY2F1c2UgdGhlcmUgYXJlIHRvbyBtYW55IGRpZmZlcmVudCB2YWx1ZXMgZm9yIG9uZS1ob3QgZW5jb2RpbmcuIEluIGFkZGl0aW9uLCBzb21lIHRpdGxlcyBhcmUgdW5jbGVhciAoTkxQIHJlcXVpcmVkKQpgYGB7cn0Kbl9kaXN0aW5jdChsY19kYXRhJGVtcF90aXRsZSkKYGBgCkFzIHdlIGNhbiBvYnNlcnZlLCB0aGVyZSBhcmUgNDAzNjMgTkFzLiBXZSBjYW4gYXNzdW1lIDQwMzYzIGRvIG5vdCB3b3JrLgpgYGB7cn0KYmFycGxvdCh0YWJsZShsY19kYXRhJGVtcF9sZW5ndGgpLAogICAgICAgIHhsYWIgPSAiZW1wX2xlbmd0aCB5ZWFycyIsIAogICAgICAgIHlsYWIgPSAiRnJlcXVlbmN5IiwgCiAgICAgICAgY29sID0gInNreWJsdWUiLCAKICAgICAgICBib3JkZXIgPSAiYmxhY2siLAogICAgICAgIGNleC5uYW1lcyA9IDAuNikgICMgVGhlIHNpemUgb2YgdGhlIG1haW4gdGl0bGUKYGBgCgpTaW5jZSAqKmVtcF9sZW5ndGgqKiBzZWVtcyB0byBiZSBjYXRlZ29yaWNhbCwgd2UgdHJhbnNmb3JtIGl0IHRvIGFzIGEgZmFjdG9yIGFuZCB0aGVuIGFzIG51bWVyaWMuClRoZSBjb252ZXJzaW9uIHRvIG51bWVyaWMgaXMgbmVlZGVkIGZvciBzdXBwb3J0aW5nIHRoZSBYR0Jvb3N0IApgYGB7cn0KbGNfZGF0YSRlbXBfbGVuZ3RoIDwtIGFzLmZhY3RvcihsY19kYXRhJGVtcF9sZW5ndGgpCmdncGxvdChkYXRhID0gbGNfZGF0YSwgbWFwcGluZyA9IGFlcyh4PWludF9yYXRlLHk9ZW1wX2xlbmd0aCkpICsgZ2VvbV9ib3hwbG90KCkKbGNfZGF0YSRlbXBfbGVuZ3RoIDwtIGFzLm51bWVyaWMobGNfZGF0YSRlbXBfbGVuZ3RoKQpgYGAKCgpDbGVhbmluZyBvZiAqKmhvbWVfb3duZXJzaGlwKio6CgpEdXJpbmcgdGhlIGRhdGEgY2xlYW5pbmcgcGhhc2UsIG91ciBhbmFseXNpcyByZXZlYWxlZCB0aGF0IHRoZSB2YXJpYWJsZSAiaG9tZV9vd25lcnNoaXAiIGRvZXMgbm90IHNob3cgYSBkaXN0aW5jdCBjb3JyZWxhdGlvbiB3aXRoIGludGVyZXN0IHJhdGVzLiBTcGVjaWZpY2FsbHksIGFtb25nIHRoZSBjYXRlZ29yaWVzLCAiQU5ZIiBhbmQgIk9USEVSIiBjb250YWluIDIgYW5kIDE1NCBjYXNlcywgcmVzcGVjdGl2ZWx5LCB3aGlsZSB0aGUgIk5PTkUiIGNhdGVnb3J5IGNvbXByaXNlcyAzOSBjYXNlcy4gQWx0aG91Z2ggdGhlICJOT05FIiBjYXRlZ29yeSBhcHBlYXJzIHRvIGRlbW9uc3RyYXRlIGEgaGlnaGVyIGludGVyZXN0IHJhdGUgY29tcGFyZWQgdG8gb3RoZXJzLCB0aGUgbGltaXRlZCBzYW1wbGUgc2l6ZSBvZiAzOSBjYXNlcyByYWlzZXMgZG91YnRzIGFib3V0IHRo
ZSByZWxpYWJpbGl0eSBvZiB0aGlzIG9ic2VydmF0aW9uLiBOb3RhYmx5LCB0aGUgIk5PTkUiIGNhdGVnb3J5IG1pZ2h0IHBlcnRhaW4gdG8gaW5kaXZpZHVhbHMgZXhwZXJpZW5jaW5nIGhvbWVsZXNzbmVzcywgcHJvbXB0aW5nIGV0aGljYWwgY29uY2VybnMgYWJvdXQgbG9hbiBwcm92aXNpb24gdG8gdGhpcyBkZW1vZ3JhcGhpYy4KCmBgYHtyfQp0YWJsZShsY19kYXRhJGhvbWVfb3duZXJzaGlwKQpnZ3Bsb3QoZGF0YSA9IGxjX2RhdGEsIG1hcHBpbmcgPSBhZXMoeD1pbnRfcmF0ZSx5PWhvbWVfb3duZXJzaGlwKSkgKyBnZW9tX2JveHBsb3QoKQpgYGAKVGhlbiwgd2UgcmV0YWluIG1vcnRnYWdlLCBvd24gYW5kIHJlbnQ6CmBgYHtyfQpsY19kYXRhIDwtIGxjX2RhdGEgJT4lIGZpbHRlcihob21lX293bmVyc2hpcCAlaW4lIGMoIk1PUlRHQUdFIiwiT1dOIiwiUkVOVCIpKQpsY19kYXRhJGhvbWVfb3duZXJzaGlwIDwtIGFzLm51bWVyaWMoYXMuZmFjdG9yKGxjX2RhdGEkaG9tZV9vd25lcnNoaXApKQpgYGAKCiMgYXBwbGljYXRpb24gam9pbnQgaGFuZGxpbmcKYGBge3J9CgojIG1lcmdpbmcgYW5udWFsIGluY29tZQpsY19kYXRhIDwtIGxjX2RhdGEgJT4lIG11dGF0ZSgKICAgIGFubnVhbF9pbmNfbWVyZ2VkID0gaWZlbHNlKGlzLm5hKGFubnVhbF9pbmNfam9pbnQpPT0gVFJVRSwgYW5udWFsX2luYyxhbm51YWxfaW5jX2pvaW50KSkgCgpsY19kYXRhIDwtIGxjX2RhdGEgJT4lIHNlbGVjdCgtYW5udWFsX2luYywtYW5udWFsX2luY19qb2ludCkKCgojIG1lcmdpbmcgZGVidCB0byBpbmNvbWUgcmF0aW8KbGNfZGF0YSA8LSBsY19kYXRhICU+JSBtdXRhdGUoCiAgICBkdGlfbWVyZ2VkID0gaWZlbHNlKGlzLm5hKGR0aV9qb2ludCk9PSBUUlVFLCBkdGksZHRpX2pvaW50KSkgCgpsY19kYXRhIDwtIGxjX2RhdGEgJT4lIHNlbGVjdCgtZHRpLC1kdGlfam9pbnQpCgpgYGAKClVwb24gcmV2aWV3aW5nIHRoZSBzdW1tYXJ5IGFnYWluLCBpdCBiZWNvbWVzIGFwcGFyZW50IHRoYXQgdGhlcmUgYXJlIG1lcmVseSA0NjAgam9pbnQgYXBwbGljYXRpb25zLCBjb25zdGl0dXRpbmcgYSBzbWFsbCBzdWJzZXQgd2l0aGluIHRoZSBleHRlbnNpdmUgZGF0YXNldCBvZiBhcm91bmQgODAwayByb3dzLiBUaHJvdWdoIGNvbnNvbGlkYXRpbmcgdGhlIGRlYnQtdG8taW5jb21lIHJhdGlvcyAoZHRpJ3MpLCB3ZSBjYW4gcGlucG9pbnQgdGhlIGRhdGEgcGVydGluZW50IHRvIG91ciByZXNlYXJjaCBvYmplY3RpdmVzLiBIZW5jZSwgaXQgaXMgYWR2aXNhYmxlIHRvIGVsaW1pbmF0ZSB0aGUgY29sdW1ucyB2ZXJpZmljYXRpb25fc3RhdHVzX2pvaW50IGFuZCBhcHBsaWNhdGlvbl90eXBlIHRvIHByZXZlbnQgaW50cm9kdWNpbmcgdW53YXJyYW50ZWQgdmFyaWFiaWxpdHkgaW50byBvdXIgYW5hbHlzaXMuCgpgYGB7cn0KdGFibGUobGNfZGF0YSR2ZXJpZmljYXRpb25fc3RhdHVzKQp0YWJsZShsY19kYXRhJHZlcmlmaWNhdGlvbl9zdGF0dXNfam9pbnQpCmBgYAoKYGBg
e3J9CmxjX2RhdGEkdmVyaWZpY2F0aW9uX3N0YXR1cyA8LSBhcy5udW1lcmljKGFzLmZhY3RvcihsY19kYXRhJHZlcmlmaWNhdGlvbl9zdGF0dXMpKQpsY19kYXRhIDwtIGxjX2RhdGEgJT4lIHNlbGVjdCgtdmVyaWZpY2F0aW9uX3N0YXR1c19qb2ludCwgLWFwcGxpY2F0aW9uX3R5cGUpCmBgYAoKCkxldCdzIGNoZWNsIGlmIG90aGVyIGlzIE5BIG9yIGEgcmVhbCB2YWx1ZSBmb3IgcHVycG9zZS4gSXQncyBhIHJlYWwgb25lLCBzbyB3ZSBkb24ndCBoYXZlIHRvIGhhbmRsZSBpdC4KYGBge3J9CmxjX2RhdGEkcHVycG9zZSA8LSBhcy5mYWN0b3IobGNfZGF0YSRwdXJwb3NlKQpnZ3Bsb3QoZGF0YSA9IGxjX2RhdGEsIG1hcHBpbmcgPSBhZXMoeD1pbnRfcmF0ZSx5PXB1cnBvc2UpKSArIGdlb21fYm94cGxvdCgpCmxjX2RhdGEkcHVycG9zZSA8LSBhcy5udW1lcmljKGxjX2RhdGEkcHVycG9zZSkKYGBgCkxldCdzIGhhdmUgYSBnbGFuY2UgdG8gdGhlIHN0YXRlIGFkZHJlc3M6CmBgYHtyfQp0YWJsZShsY19kYXRhJGFkZHJfc3RhdGUpCmxjX2RhdGEkYWRkcl9zdGF0ZSA8LSBhcy5mYWN0b3IobGNfZGF0YSRhZGRyX3N0YXRlKQpnZ3Bsb3QoZGF0YSA9IGxjX2RhdGEsIG1hcHBpbmcgPSBhZXMoeD1pbnRfcmF0ZSx5PWFkZHJfc3RhdGUpKSArIGdlb21fYm94cGxvdCgpCmxjX2RhdGEkYWRkcl9zdGF0ZSA8LSBhcy5udW1lcmljKGxjX2RhdGEkYWRkcl9zdGF0ZSkKYGBgClJlZ2FyZGluZyBkZWxpbnF1ZW5jeSBpbiB0aGUgbGFzdCAyIHllYXJzLCB0aGVyZSBhcmUgZmV3IE5BcyB0aGVuIHJlbW92ZSB0aGVtOgpgYGB7cn0KbGNfZGF0YSA8LSBsY19kYXRhICU+JSAKICAgIGZpbHRlcighKGlzLm5hKGRlbGlucV8yeXJzKSkpCmBgYAoKCmBgYHtyfQpsY19kYXRhIDwtIGxjX2RhdGEgJT4lCiAgbXV0YXRlKG10aHNfc2luY2VfZGVsaW5xX2NhdCA9IGlmZWxzZSgKICAgIGlzLm5hKG10aHNfc2luY2VfbGFzdF9kZWxpbnEpID09IFRSVUUsCiAgICAiTk9ORSIsCiAgICBpZmVsc2UoCiAgICAgIG10aHNfc2luY2VfbGFzdF9kZWxpbnEgPD0gMTIsCiAgICAgICJMZXNzXzFfWSIsCiAgICAgIGlmZWxzZSgKICAgICAgICBtdGhzX3NpbmNlX2xhc3RfZGVsaW5xIDw9IDI0LAogICAgICAgICJMZXNzXzJfWSIsCiAgICAgICAgaWZlbHNlKAogICAgICAgICAgbXRoc19zaW5jZV9sYXN0X2RlbGlucSA8PSAzNiwKICAgICAgICAgICJMZXNzXzNfWSIsCiAgICAgICAgICBpZmVsc2UobXRoc19zaW5jZV9sYXN0X2RlbGlucSA8PSA0OCwgIkxlc3NfNF9ZIiwgIk1vcmVfNF9ZIikKICAgICAgICApCiAgICAgICkKICAgICkKICApKSAlPiUgc2VsZWN0KC1tdGhzX3NpbmNlX2xhc3RfZGVsaW5xKQogICAgICAgICAgCmxjX2RhdGEkbXRoc19zaW5jZV9kZWxpbnFfY2F0IDwtIGFzLmZhY3RvcihsY19kYXRhJG10aHNfc2luY2VfZGVsaW5xX2NhdCkKZ2dwbG90KGRhdGEgPSBsY19kYXRhLCBtYXBwaW5nID0gYWVzKHg9aW50X3JhdGUseT1tdGhzX3NpbmNlX2RlbGlucV9j
YXQpKStnZW9tX2JveHBsb3QoKQpsY19kYXRhJG10aHNfc2luY2VfZGVsaW5xX2NhdCA8LSBhcy5udW1lcmljKGxjX2RhdGEkbXRoc19zaW5jZV9kZWxpbnFfY2F0KQpgYGAKCmBgYHtyfQpsY19kYXRhIDwtIGxjX2RhdGEgJT4lCiAgbXV0YXRlKG10aHNfc2luY2VfbGFzdF9yZWNvcmRfY2F0ID0gaWZlbHNlKAogICAgaXMubmEobXRoc19zaW5jZV9sYXN0X3JlY29yZCkgPT0gVFJVRSwKICAgICJOT05FIiwKICAgIGlmZWxzZSgKICAgICAgbXRoc19zaW5jZV9sYXN0X3JlY29yZCA8PSAxMiwKICAgICAgIkxlc3NfMV9ZIiwKICAgICAgaWZlbHNlKAogICAgICAgIG10aHNfc2luY2VfbGFzdF9yZWNvcmQgPD0gMjQsCiAgICAgICAgIkxlc3NfMl9ZIiwKICAgICAgICBpZmVsc2UoCiAgICAgICAgICBtdGhzX3NpbmNlX2xhc3RfcmVjb3JkIDw9IDM2LAogICAgICAgICAgIkxlc3NfM19ZIiwKICAgICAgICAgIGlmZWxzZShtdGhzX3NpbmNlX2xhc3RfcmVjb3JkIDw9IDQ4LCAiTGVzc180X1kiLCAiTW9yZV80X1kiKQogICAgICAgICkKICAgICAgKQogICAgKQogICkpICU+JSBzZWxlY3QoLW10aHNfc2luY2VfbGFzdF9yZWNvcmQpCgpsY19kYXRhJG10aHNfc2luY2VfbGFzdF9yZWNvcmRfY2F0IDwtIGFzLmZhY3RvcihsY19kYXRhJG10aHNfc2luY2VfbGFzdF9yZWNvcmRfY2F0KQpnZ3Bsb3QoZGF0YSA9IGxjX2RhdGEsIG1hcHBpbmcgPSBhZXMoeD1pbnRfcmF0ZSx5PW10aHNfc2luY2VfbGFzdF9yZWNvcmRfY2F0KSkrZ2VvbV9ib3hwbG90KCkKbGNfZGF0YSRtdGhzX3NpbmNlX2xhc3RfcmVjb3JkX2NhdCA8LSBhcy5udW1lcmljKGxjX2RhdGEkbXRoc19zaW5jZV9sYXN0X3JlY29yZF9jYXQpCmBgYAoKYGBge3J9CmxjX2RhdGEgPC1sY19kYXRhICU+JSAKICBtdXRhdGUobXRoc19zaW5jZV9sYXN0X21ham9yX2Rlcm9nX2NhdCA9ICBpZmVsc2UoCiAgICBpcy5uYShtdGhzX3NpbmNlX2xhc3RfbWFqb3JfZGVyb2cpID09IFRSVUUsCiAgICAiTk9ORSIsCiAgICBpZmVsc2UoCiAgICAgIG10aHNfc2luY2VfbGFzdF9tYWpvcl9kZXJvZyA8PSAxMiwKICAgICAgIkxlc3NfMV9ZIiwKICAgICAgaWZlbHNlKAogICAgICAgIG10aHNfc2luY2VfbGFzdF9tYWpvcl9kZXJvZyA8PSAyNCwKICAgICAgICAiTGVzc18yX1kiLAogICAgICAgIGlmZWxzZSgKICAgICAgICAgIG10aHNfc2luY2VfbGFzdF9tYWpvcl9kZXJvZyA8PSAzNiwKICAgICAgICAgICJMZXNzXzNfWSIsCiAgICAgICAgICBpZmVsc2UobXRoc19zaW5jZV9sYXN0X21ham9yX2Rlcm9nIDw9IDQ4LCAiTGVzc180X1kiLCAiTW9yZV80X1kiKQogICAgICAgICkKICAgICAgKQogICAgKQogICkpICU+JSBzZWxlY3QoLW10aHNfc2luY2VfbGFzdF9tYWpvcl9kZXJvZykKCmxjX2RhdGEkbXRoc19zaW5jZV9sYXN0X21ham9yX2Rlcm9nX2NhdCA8LSBhcy5mYWN0b3IobGNfZGF0YSRtdGhzX3NpbmNlX2xhc3RfbWFqb3JfZGVyb2dfY2F0KQpnZ3Bsb3QoZGF0YSA9IGxjX2RhdGEsIG1hcHBpbmcgPSBh
ZXMoeD1pbnRfcmF0ZSx5PW10aHNfc2luY2VfbGFzdF9tYWpvcl9kZXJvZ19jYXQpKStnZW9tX2JveHBsb3QoKQpsY19kYXRhJG10aHNfc2luY2VfbGFzdF9tYWpvcl9kZXJvZ19jYXQgPC0gYXMubnVtZXJpYyhsY19kYXRhJG10aHNfc2luY2VfbGFzdF9tYWpvcl9kZXJvZ19jYXQpCgpgYGAKCmBgYHtyfQpsY19kYXRhJGluaXRpYWxfbGlzdF9zdGF0dXMgPC0gYXMuZmFjdG9yKGxjX2RhdGEkaW5pdGlhbF9saXN0X3N0YXR1cykKZ2dwbG90KGRhdGEgPSBsY19kYXRhLCBtYXBwaW5nID0gYWVzKHg9aW50X3JhdGUseT1pbml0aWFsX2xpc3Rfc3RhdHVzKSkrZ2VvbV9ib3hwbG90KCkKbGNfZGF0YSRpbml0aWFsX2xpc3Rfc3RhdHVzIDwtIGFzLm51bWVyaWMobGNfZGF0YSRpbml0aWFsX2xpc3Rfc3RhdHVzKQpgYGAKCkxldCdzIGNoZWNrIHdoaWNoIGNvbHVtbnMgc3RpbGwgaGF2ZSBudWxsIHZhbHVlcwpgYGB7cn0KY29sU3Vtcyhpcy5uYShsY19kYXRhKSkKYGBgClRoZSBjb2x1bW5zICoqcmV2b2xfYmFsKiogYW5kICoqcmV2b2xfdXRpbCoqIGNvbnRhaW4gb25seSBmZXcgTkEgdmFsdWVzLCB0aG9zZSB2YWx1ZXMgY2FuJ3QgYmUgcmVwbGFjZWQgd2l0aCAwLCB0aGVuIHdlIGZpbHRlciB0aGUgdmFsdWVzIHdoaWNoIGFyZSBub3QgTkEKYGBge3J9CmxjX2RhdGEgPC0gbGNfZGF0YSAlPiUgCiAgICBmaWx0ZXIoIShpcy5uYShyZXZvbF9iYWwpKSkgJT4lIAogICAgICAgIGZpbHRlcighKGlzLm5hKHJldm9sX3V0aWwpKSkKYGBgCgoKTGV0J3MgY2hlY2sgd2hpY2ggY29sdW1ucyBzdGlsbCBoYXZlIG51bGwgdmFsdWVzCmBgYHtyfQpuYW1lcyh3aGljaChjb2xTdW1zKGlzLm5hKGxjX2RhdGEpKSA+IDApKQpgYGAKClJlcGxhY2UgbnVsbCB2YWx1ZXMgd2l0aCAwIHdoZXJlIGlzIHBvc3NpYmxlCmBgYHtyfQpsY19kYXRhIDwtCiAgbGNfZGF0YSAlPiUKICBtdXRhdGUob3Blbl9hY2NfNm0gPSBpZmVsc2UoaXMubmEob3Blbl9hY2NfNm0pID09IFRSVUUsIDAsIG9wZW5fYWNjXzZtKSkgJT4lCiAgbXV0YXRlKHRvdF9jdXJfYmFsID0gaWZlbHNlKGlzLm5hKHRvdF9jdXJfYmFsKSA9PSBUUlVFLCAwLCB0b3RfY3VyX2JhbCkpICU+JQogIG11dGF0ZShvcGVuX2lsXzZtID0gaWZlbHNlKGlzLm5hKG9wZW5faWxfNm0pID09IFRSVUUsIDAsIG9wZW5faWxfNm0pKSAlPiUKICBtdXRhdGUob3Blbl9pbF8xMm0gPSBpZmVsc2UoaXMubmEob3Blbl9pbF8xMm0pID09IFRSVUUsIDAsIG9wZW5faWxfMTJtKSkgJT4lCiAgbXV0YXRlKG9wZW5faWxfMjRtID0gaWZlbHNlKGlzLm5hKG9wZW5faWxfMjRtKSA9PSBUUlVFLCAwLCBvcGVuX2lsXzI0bSkpICU+JQogIG11dGF0ZShtdGhzX3NpbmNlX3JjbnRfaWwgPSBpZmVsc2UoaXMubmEobXRoc19zaW5jZV9yY250X2lsKSA9PSBUUlVFLCAwLCBtdGhzX3NpbmNlX3JjbnRfaWwpKSAlPiUKICBtdXRhdGUodG90YWxfYmFsX2lsID0gaWZlbHNlKGlzLm5hKHRvdGFsX2JhbF9pbCkgPT0gVFJVRSwgMCwgdG90YWxfYmFs
X2lsKSkgJT4lCiAgbXV0YXRlKGlsX3V0aWwgPSBpZmVsc2UoaXMubmEoaWxfdXRpbCkgPT0gVFJVRSwgMCwgaWxfdXRpbCkpICU+JQogIG11dGF0ZShvcGVuX3J2XzEybSA9IGlmZWxzZShpcy5uYShvcGVuX3J2XzEybSkgPT0gVFJVRSwgMCwgb3Blbl9ydl8xMm0pKSAlPiUKICBtdXRhdGUodG90YWxfcmV2X2hpX2xpbSA9IGlmZWxzZShpcy5uYSh0b3RhbF9yZXZfaGlfbGltKSA9PSBUUlVFLCAwLCB0b3RhbF9yZXZfaGlfbGltKSkgJT4lCiAgbXV0YXRlKG1heF9iYWxfYmMgPSBpZmVsc2UoaXMubmEobWF4X2JhbF9iYykgPT0gVFJVRSwgMCwgbWF4X2JhbF9iYykpICU+JQogIG11dGF0ZShhbGxfdXRpbCA9IGlmZWxzZShpcy5uYShhbGxfdXRpbCkgPT0gVFJVRSwgMCwgYWxsX3V0aWwpKSAlPiUKICBtdXRhdGUoaW5xX2ZpID0gaWZlbHNlKGlzLm5hKGlucV9maSkgPT0gVFJVRSwgMCwgaW5xX2ZpKSkgJT4lCiAgbXV0YXRlKHRvdGFsX2N1X3RsID0gaWZlbHNlKGlzLm5hKHRvdGFsX2N1X3RsKSA9PSBUUlVFLCAwLCB0b3RhbF9jdV90bCkpICU+JQogIG11dGF0ZShpbnFfbGFzdF8xMm0gPSBpZmVsc2UoaXMubmEoaW5xX2xhc3RfMTJtKSA9PSBUUlVFLCAwLCBpbnFfbGFzdF8xMm0pKSAlPiUKICBtdXRhdGUob3Blbl9ydl8yNG0gPSBpZmVsc2UoaXMubmEob3Blbl9ydl8yNG0pID09IFRSVUUsIDAsIG9wZW5fcnZfMjRtKSkgJT4lCiAgbXV0YXRlKHRvdF9jb2xsX2FtdCA9IGlmZWxzZShpcy5uYSh0b3RfY29sbF9hbXQpPT0gVFJVRSwwLCB0b3RfY29sbF9hbXQpKSAlPiUKICBtdXRhdGUoY29sbGVjdGlvbnNfMTJfbXRoc19leF9tZWQgPSBpZmVsc2UoaXMubmEoY29sbGVjdGlvbnNfMTJfbXRoc19leF9tZWQpPT0gVFJVRSwwLCBjb2xsZWN0aW9uc18xMl9tdGhzX2V4X21lZCkpCmBgYAoKKiplYXJsaWVzdF9jcl9saW5lKiogY29udGFpbnMgdGhlIG1vbnRoIHRoZSBib3Jyb3dlcidzIGVhcmxpZXN0IHJlcG9ydGVkIGNyZWRpdCBsaW5lIHdhcyBvcGVuZWQuCkV2ZW4gaWYgdGhpcyBkYXRlIGNvbnNpc3RzIG9ubHkgb24gbW9udGggYW5kIHllYXIsIHN0aWxsIHRoZXJlIGFyZSB0b28gbWFueSB1bmlxdWUgdmFsdWVzLgpXZSBjb3VsZCB0cmFuc2Zvcm0gdGhlIGRhdGVzIGluIHRvIGEgbnVtZXJpY2FsIHZhbHVlLCBieSBjb252ZXJ0aW5nIHRoZW0gZnJvbSBkYXRlIGludG8gVW5peCBUaW1lLgpUaGlzIHVuaXQgbWVhc3VyZXMgdGltZSBieSB0aGUgbnVtYmVyIG9mIHNlY29uZHMgdGhhdCBoYXZlIGVsYXBzZWQgc2luY2UgMDA6MDA6MDAgVVRDIG9uIDEgSmFudWFyeSAxOTcwLgpTaW5jZSB0aGlzIGNvbHVtbiBkb2Vzbid0IGNvbnRhaW4gdGhlIGRheSBudW1iZXIsIHdlIHRha2UgYXMgYSByZWZlcmVuY2UgdGhlIGZpcnN0IGRheSBvZiB0aGUgbW9udGguCgpgYGB7cn0KbGNfZGF0YSA8LSBsY19kYXRhICU+JSAKICAgIGZpbHRlcighKGlzLm5hKGVhcmxpZXN0X2NyX2xpbmUpKSkKCiMgZnVuY3Rpb24gdG8gcmVwbGFjZSBkYXRlcyB3aXRo
IHVuaXggdGltZQp0b191bml4X3RpbWUgPC0gZnVuY3Rpb24oZGF0ZSkgewogIHRtcCA8LSBwYXN0ZSgiMDEiLCBkYXRlLCBzZXA9Ii0iKQogIHJldHVybiAoYXMubnVtZXJpYyhhcy5QT1NJWGN0KHRtcCwgZm9ybWF0PSIlZC0lYi0lWSIsIHR6PSJVVEMiKSkpCn0KCiMgbWFwIGRhdGVzIHRvIHVuaXggdGltZQpsY19kYXRhJGVhcmxpZXN0X2NyX2xpbmUgPC0gYXBwbHkobGNfZGF0YSwgMSwgZnVuY3Rpb24ocm93KSB0b191bml4X3RpbWUocm93WyJlYXJsaWVzdF9jcl9saW5lIl0pKQoKIyBzdGFuZGFyZGl6ZSB0aGVtCiNsY19kYXRhJGVhcmxpZXN0X2NyX2xpbmUgPC0gc2NhbGUobGNfZGF0YSRlYXJsaWVzdF9jcl9saW5lKQpgYGAKCmBgYHtyfQpzdW1tYXJ5KGxjX2RhdGEpCmBgYAoKCmBgYHtyfQojcm91bmQoY29yKGxjX2RhdGEpLDIpCmBgYAoKYGBge3J9CgojIFRPRE86IChwYXJ0ZSB2ZWNjaGlhKSwgc3BsaXQgODAvMjAgZSBsaW5lYXIgcmVncmVzc2lvbi4uLgojIENyZWF0ZSBpbmRpY2VzIGZvciBzcGxpdHRpbmcgKDgwJSB0cmFpbiwgMjAlIHRlc3QpCnRyYWluX2luZGljZXMgPC0gY3JlYXRlRGF0YVBhcnRpdGlvbihsY19kYXRhJGludF9yYXRlLCBwID0gMC44LCBsaXN0ID0gRkFMU0UpCgojIENyZWF0ZSB0cmFpbmluZyBhbmQgdGVzdGluZyBkYXRhc2V0cwp0cmFpbl9kYXRhIDwtIGxjX2RhdGFbdHJhaW5faW5kaWNlcywgXQp0ZXN0X2RhdGEgPC0gbGNfZGF0YVstdHJhaW5faW5kaWNlcywgXQoKIyMjIyBMaW5lYXIgUmVncmVzc2lvbiAjIyMjCiNsbS5maXQgPC0gbG0oaW50X3JhdGUgfiAuLCBkYXRhID0gdHJhaW5fZGF0YSkKCiMgVE9ETzogY2hlY2sgY29sbGluZWFyaXR5IGFuZCBtdWx0aWNvbGxpbmVhcml0eQojdmlmKGxtLmZpdCkgIyB0aGVyZSBpcyBtdWx0aWNvbGxpbmVhcml0eQojY29yKGxjX2RhdGEpIAoKIyBNYWtlIHByZWRpY3Rpb25zIG9uIHRyYWluaW5nIGFuZCB0ZXN0aW5nIGRhdGEKI3RyYWluX3ByZWRpY3Rpb25zIDwtIHByZWRpY3QobG0uZml0LCBuZXdkYXRhID0gdHJhaW5fZGF0YSkKI3Rlc3RfcHJlZGljdGlvbnMgPC0gcHJlZGljdChsbS5maXQsIG5ld2RhdGEgPSB0ZXN0X2RhdGEpCgojIEV2YWx1YXRlIG1vZGVsIHBlcmZvcm1hbmNlIG9uIHRyYWluaW5nIGRhdGEKI3RyYWluX3Jtc2UgPC0gc3FydChtZWFuKCh0cmFpbl9wcmVkaWN0aW9ucyAtIHRyYWluX2RhdGEkaW50X3JhdGUpXjIpKQojdHJhaW5fcl9zcXVhcmVkIDwtIHN1bW1hcnkobG0uZml0KSRyLnNxdWFyZWQKCiMgRXZhbHVhdGUgbW9kZWwgcGVyZm9ybWFuY2Ugb24gdGVzdGluZyBkYXRhCiN0ZXN0X3Jtc2UgPC0gc3FydChtZWFuKCh0ZXN0X3ByZWRpY3Rpb25zIC0gdGVzdF9kYXRhJGludF9yYXRlKV4yKSkKI3Rlc3Rfcl9zcXVhcmVkIDwtIHN1bW1hcnkobG0uZml0LCB0ZXN0X2RhdGEpJHIuc3F1YXJlZAoKIyBQcmludCBldmFsdWF0aW9uIG1ldHJpY3MKI2NhdCgiVHJhaW5pbmcgUk1TRToiLCB0cmFpbl9ybXNlLCAiXG4iKQojY2F0
KCJUcmFpbmluZyBSLXNxdWFyZWQ6IiwgdHJhaW5fcl9zcXVhcmVkLCAiXG4iKQojcm1zZSA8LSBzcXJ0KG1lYW4obG0uZml0JHJlc2lkdWFsc14yKSkKI3ByaW50KHJtc2UpCmBgYAoKYGBge3J9CiMgMSUgb2YgdGhlIHRvdGFsIHJvd3MKc2FtcGxlX3RyYWluX3NpemUgPC0gZmxvb3IoMC4wMSAqIG5yb3codHJhaW5fZGF0YSkpCnNhbXBsZV90ZXN0X3NpemUgPC0gZmxvb3IoMC4wMSAqIG5yb3codGVzdF9kYXRhKSkKCiMgUmFuZG9tbHkgc2VsZWN0IDElIG9mIHRoZSByb3dzCnNhbXBsZWRfdHJhaW5fZGF0YSA8LSB0cmFpbl9kYXRhW3NhbXBsZShucm93KHRyYWluX2RhdGEpLCBzaXplID0gc2FtcGxlX3RyYWluX3NpemUsIHJlcGxhY2UgPSBGQUxTRSksIF0Kc2FtcGxlZF90ZXN0X2RhdGEgPC0gdGVzdF9kYXRhW3NhbXBsZShucm93KHRlc3RfZGF0YSksIHNpemUgPSBzYW1wbGVfdGVzdF9zaXplLCByZXBsYWNlID0gRkFMU0UpLCBdCgpzYW1wbGVkX3RyYWluX2RhdGEgPC0gdHJhaW5fZGF0YQpzYW1wbGVkX3Rlc3RfZGF0YSA8LSB0ZXN0X2RhdGEKCiMjIyMgTGluZWFyIFJlZ3Jlc3Npb24gIyMjIwoKbG0uZml0IDwtIGxtKGludF9yYXRlIH4gLiwgZGF0YSA9IHNhbXBsZWRfdHJhaW5fZGF0YSkKCiMgTWFrZSBwcmVkaWN0aW9ucyBvbiB0aGUgdHJhaW5pbmcgYW5kIHRlc3RpbmcgZGF0YQpsbS50cmFpbl9wcmVkaWN0aW9ucyA8LSBwcmVkaWN0KGxtLmZpdCwgbmV3ZGF0YSA9IHNhbXBsZWRfdHJhaW5fZGF0YSkKbG0udGVzdF9wcmVkaWN0aW9ucyA8LSBwcmVkaWN0KGxtLmZpdCwgbmV3ZGF0YSA9IHNhbXBsZWRfdGVzdF9kYXRhKQoKIyBDYWxjdWxhdGUgTWVhbiBTcXVhcmVkIEVycm9yIChNU0UpIGZvciB0cmFpbmluZyBhbmQgdGVzdGluZwpsbS50cmFpbl9tc2UgPC0gbWVhbigobG0udHJhaW5fcHJlZGljdGlvbnMgLSBzYW1wbGVkX3RyYWluX2RhdGEkaW50X3JhdGUpXjIpCmxtLnRlc3RfbXNlIDwtIG1lYW4oKGxtLnRlc3RfcHJlZGljdGlvbnMgLSBzYW1wbGVkX3Rlc3RfZGF0YSRpbnRfcmF0ZSleMikKCiMgQ2FsY3VsYXRlIFJvb3QgTWVhbiBTcXVhcmVkIEVycm9yIChSTVNFKSBmb3IgdHJhaW5pbmcgYW5kIHRlc3RpbmcKbG0udHJhaW5fcm1zZSA8LSBzcXJ0KGxtLnRyYWluX21zZSkKbG0udGVzdF9ybXNlIDwtIHNxcnQobG0udGVzdF9tc2UpCgojIENhbGN1bGF0ZSBNZWFuIEFic29sdXRlIEVycm9yIChNQUUpIGZvciB0cmFpbmluZyBhbmQgdGVzdGluZwpsbS50cmFpbl9tYWUgPC0gbWVhbihhYnMobG0udHJhaW5fcHJlZGljdGlvbnMgLSBzYW1wbGVkX3RyYWluX2RhdGEkaW50X3JhdGUpKQpsbS50ZXN0X21hZSA8LSBtZWFuKGFicyhsbS50ZXN0X3ByZWRpY3Rpb25zIC0gc2FtcGxlZF90ZXN0X2RhdGEkaW50X3JhdGUpKQoKIyBDYWxjdWxhdGUgUi1zcXVhcmVkIChSwrIpIGZvciB0cmFpbmluZyBhbmQgdGVzdGluZwpsbS50cmFpbl9yMiA8LSAxIC0gKHN1bSgoc2FtcGxlZF90cmFpbl9kYXRhJGludF9yYXRlIC0gbG0udHJh
aW5fcHJlZGljdGlvbnMpXjIpIC8gc3VtKChzYW1wbGVkX3RyYWluX2RhdGEkaW50X3JhdGUgLSBtZWFuKHNhbXBsZWRfdHJhaW5fZGF0YSRpbnRfcmF0ZSkpXjIpKQpsbS50ZXN0X3IyIDwtIDEgLSAoc3VtKChzYW1wbGVkX3Rlc3RfZGF0YSRpbnRfcmF0ZSAtIGxtLnRlc3RfcHJlZGljdGlvbnMpXjIpIC8gc3VtKChzYW1wbGVkX3Rlc3RfZGF0YSRpbnRfcmF0ZSAtIG1lYW4oc2FtcGxlZF90ZXN0X2RhdGEkaW50X3JhdGUpKV4yKSkKCiMgRGlzcGxheSB0aGUgbWV0cmljcwpjYXQoIlRyYWluaW5nIE1TRToiLCBsbS50cmFpbl9tc2UsICJcbiIpCmNhdCgiVGVzdGluZyBNU0U6IiwgbG0udGVzdF9tc2UsICJcbiIpCmNhdCgiVHJhaW5pbmcgUk1TRToiLCBsbS50cmFpbl9ybXNlLCAiXG4iKQpjYXQoIlRlc3RpbmcgUk1TRToiLCBsbS50ZXN0X3Jtc2UsICJcbiIpCmNhdCgiVHJhaW5pbmcgTUFFOiIsIGxtLnRyYWluX21hZSwgIlxuIikKY2F0KCJUZXN0aW5nIE1BRToiLCBsbS50ZXN0X21hZSwgIlxuIikKY2F0KCJUcmFpbmluZyBSLXNxdWFyZWQgKFLCsik6IiwgbG0udHJhaW5fcjIsICJcbiIpCmNhdCgiVGVzdGluZyBSLXNxdWFyZWQgKFLCsik6IiwgbG0udGVzdF9yMiwgIlxuIikKCiMjIyMgTGluZWFyIFJlZ3Jlc2lvbiBhcHBseWluZyBDcm9zcyBWYWxpZGF0aW9uIHdpdGggaz0yIHRvIGs9MTAgICMjIyMKCgojIEFzc3VtaW5nICdzYW1wbGVkX3RyYWluX2RhdGEnIGlzIHlvdXIgdHJhaW5pbmcgZGF0YSBzZXQKCiMgSW5pdGlhbGl6ZSBsaXN0cyB0byBzdG9yZSBtb2RlbHMgYW5kIHRoZWlyIHJlc3VsdHMKbW9kZWxzIDwtIGxpc3QoKQpyZXN1bHRzIDwtIGRhdGEuZnJhbWUoKQoKIyBEZWZpbmUgdGhlIG51bWJlciBvZiBmb2xkcyBmb3IgY3Jvc3MtdmFsaWRhdGlvbgpudW1fZm9sZHMgPC0gMTAKZm9sZHMgPC0gY3JlYXRlRm9sZHMoc2FtcGxlZF90cmFpbl9kYXRhJGludF9yYXRlLCBrID0gbnVtX2ZvbGRzLCBsaXN0ID0gVFJVRSkKCiMgUGVyZm9ybSBrLWZvbGQgY3Jvc3MtdmFsaWRhdGlvbgpmb3IoaSBpbiBzZXFfYWxvbmcoZm9sZHMpKSB7CiAgIyBTcGxpdCB0aGUgZGF0YSBpbnRvIHRyYWluaW5nIGFuZCB0ZXN0aW5nIGZvciB0aGUgY3VycmVudCBmb2xkCiAgdHJhaW5faW5kaWNlcyA8LSBmb2xkc1tbaV1dCiAgdGVzdF9pbmRpY2VzIDwtIHNldGRpZmYoc2VxX2xlbihucm93KHNhbXBsZWRfdHJhaW5fZGF0YSkpLCB0cmFpbl9pbmRpY2VzKQogIAogIHRyYWluX2RhdGFfZm9sZCA8LSBzYW1wbGVkX3RyYWluX2RhdGFbdHJhaW5faW5kaWNlcywgXQogIHRlc3RfZGF0YV9mb2xkIDwtIHNhbXBsZWRfdHJhaW5fZGF0YVt0ZXN0X2luZGljZXMsIF0KICAKICAjIEZpdCB0aGUgbW9kZWwgb24gdGhlIHRyYWluaW5nIGZvbGQKICBsbV9tb2RlbCA8LSBsbShpbnRfcmF0ZSB+IC4sIGRhdGEgPSB0cmFpbl9kYXRhX2ZvbGQpCiAgbW9kZWxzW1tpXV0gPC0gbG1fbW9kZWwgICMgU3RvcmUgdGhlIG1vZGVsCiAgCiAgIyBNYWtlIHByZWRpY3Rp
b25zIG9uIHRoZSB0cmFpbmluZyBhbmQgdGVzdGluZyBmb2xkCiAgdHJhaW5fcHJlZGljdGlvbnMgPC0gcHJlZGljdChsbV9tb2RlbCwgbmV3ZGF0YSA9IHRyYWluX2RhdGFfZm9sZCkKICB0ZXN0X3ByZWRpY3Rpb25zIDwtIHByZWRpY3QobG1fbW9kZWwsIG5ld2RhdGEgPSB0ZXN0X2RhdGFfZm9sZCkKICAKICAjIENhbGN1bGF0ZSBtZXRyaWNzIGZvciB0cmFpbmluZyBmb2xkCiAgdHJhaW5fbXNlIDwtIG1lYW4oKHRyYWluX3ByZWRpY3Rpb25zIC0gdHJhaW5fZGF0YV9mb2xkJGludF9yYXRlKV4yKQogIHRyYWluX3Jtc2UgPC0gc3FydCh0cmFpbl9tc2UpCiAgdHJhaW5fbWFlIDwtIG1lYW4oYWJzKHRyYWluX3ByZWRpY3Rpb25zIC0gdHJhaW5fZGF0YV9mb2xkJGludF9yYXRlKSkKICB0cmFpbl9yMiA8LSBzdW1tYXJ5KGxtX21vZGVsKSRyLnNxdWFyZWQKICAKICAjIENhbGN1bGF0ZSBtZXRyaWNzIGZvciB0ZXN0aW5nIGZvbGQKICB0ZXN0X21zZSA8LSBtZWFuKCh0ZXN0X3ByZWRpY3Rpb25zIC0gdGVzdF9kYXRhX2ZvbGQkaW50X3JhdGUpXjIpCiAgdGVzdF9ybXNlIDwtIHNxcnQodGVzdF9tc2UpCiAgdGVzdF9tYWUgPC0gbWVhbihhYnModGVzdF9wcmVkaWN0aW9ucyAtIHRlc3RfZGF0YV9mb2xkJGludF9yYXRlKSkKICB0ZXN0X3IyIDwtIDEgLSAoc3VtKCh0ZXN0X2RhdGFfZm9sZCRpbnRfcmF0ZSAtIHRlc3RfcHJlZGljdGlvbnMpXjIpIC8gc3VtKCh0ZXN0X2RhdGFfZm9sZCRpbnRfcmF0ZSAtIG1lYW4odGVzdF9kYXRhX2ZvbGQkaW50X3JhdGUpKV4yKSkKICAKICAjIFN0b3JlIG1ldHJpY3MgaW4gdGhlIHJlc3VsdHMgZGF0YWZyYW1lCiAgcmVzdWx0cyA8LSByYmluZChyZXN1bHRzLCBkYXRhLmZyYW1lKAogICAgRm9sZCA9IGksCiAgICBUcmFpbl9NU0UgPSB0cmFpbl9tc2UsIFRlc3RfTVNFID0gdGVzdF9tc2UsCiAgICBUcmFpbl9STVNFID0gdHJhaW5fcm1zZSwgVGVzdF9STVNFID0gdGVzdF9ybXNlLAogICAgVHJhaW5fTUFFID0gdHJhaW5fbWFlLCBUZXN0X01BRSA9IHRlc3RfbWFlLAogICAgVHJhaW5fUjIgPSB0cmFpbl9yMiwgVGVzdF9SMiA9IHRlc3RfcjIKICApKQp9CgojIERpc3BsYXkgdGhlIG1vZGVscyBhbmQgdGhlaXIgbWV0cmljcwpwcmludChtb2RlbHMpCnByaW50KHJlc3VsdHMpCgoKIyMjIyBEZWNpc2lvbiBUcmVlcyAjIyMjCgojIEVycm9yIGluIHRyZWU6ICJmYWN0b3IgcHJlZGljdG9ycyBtdXN0IGhhdmUgYXQgbW9zdCAzMiBsZXZlbHMiIGlzIHRocm93bi4KIyBCYXNpY2FsbHksIGl0IGJlY29tZXMgY29tcHV0YXRpb25hbGx5IGV4cGVuc2l2ZSB0byBjcmVhdGUgc28gbWFueSBzcGxpdHMgaW4geW91ciBkYXRhLCBzaW5jZSB5b3UgYXJlIHNlbGVjdGluZyB0aGUgYmVzdCBzcGxpdCBvdXQgb2YgYWxsIDJeMzIgKGFwcHJveCkgcG9zc2libGUgc3BsaXRzLgoKCiMgRml0IGEgZGVjaXNpb24gdHJlZSBtb2RlbCBvbiB0aGUgdHJhaW5pbmcgZGF0YQojdG0gPC0gdHJlZShpbnRfcmF0ZSB+IC4sIGRhdGEgPSBz
YW1wbGVkX3RyYWluX2RhdGEpCgojIE1ha2UgcHJlZGljdGlvbnMgb24gdGhlIHRyYWluaW5nIGFuZCB0ZXN0aW5nIGRhdGEKI3RtLnRyYWluX3ByZWRpY3Rpb25zIDwtIHByZWRpY3QodG0sIG5ld2RhdGEgPSBzYW1wbGVkX3RyYWluX2RhdGEpCiN0bS50ZXN0X3ByZWRpY3Rpb25zIDwtIHByZWRpY3QodG0sIG5ld2RhdGEgPSBzYW1wbGVkX3Rlc3RfZGF0YSkKCiMgQ2FsY3VsYXRlIE1lYW4gU3F1YXJlZCBFcnJvciAoTVNFKSBmb3IgdHJhaW5pbmcgYW5kIHRlc3RpbmcKI3RtLnRyYWluX21zZSA8LSBtZWFuKCh0bS50cmFpbl9wcmVkaWN0aW9ucyAtIHNhbXBsZWRfdHJhaW5fZGF0YSRpbnRfcmF0ZSleMikKI3RtLnRlc3RfbXNlIDwtIG1lYW4oKHRtLnRlc3RfcHJlZGljdGlvbnMgLSBzYW1wbGVkX3Rlc3RfZGF0YSRpbnRfcmF0ZSleMikKCiMgQ2FsY3VsYXRlIFJvb3QgTWVhbiBTcXVhcmVkIEVycm9yIChSTVNFKSBmb3IgdHJhaW5pbmcgYW5kIHRlc3RpbmcKI3RtLnRyYWluX3Jtc2UgPC0gc3FydCh0bS50cmFpbl9tc2UpCiN0bS50ZXN0X3Jtc2UgPC0gc3FydCh0bS50ZXN0X21zZSkKCiMgQ2FsY3VsYXRlIE1lYW4gQWJzb2x1dGUgRXJyb3IgKE1BRSkgZm9yIHRyYWluaW5nIGFuZCB0ZXN0aW5nCiN0bS50cmFpbl9tYWUgPC0gbWVhbihhYnModG0udHJhaW5fcHJlZGljdGlvbnMgLSBzYW1wbGVkX3RyYWluX2RhdGEkaW50X3JhdGUpKQojdG0udGVzdF9tYWUgPC0gbWVhbihhYnModG0udGVzdF9wcmVkaWN0aW9ucyAtIHNhbXBsZWRfdGVzdF9kYXRhJGludF9yYXRlKSkKCiMgQ2FsY3VsYXRlIFItc3F1YXJlZCAoUsKyKSBmb3IgdHJhaW5pbmcgYW5kIHRlc3RpbmcKI3RtLnRyYWluX3IyIDwtIDEgLSAoc3VtKChzYW1wbGVkX3RyYWluX2RhdGEkaW50X3JhdGUgLSB0bS50cmFpbl9wcmVkaWN0aW9ucyleMikgLyBzdW0oKHNhbXBsZWRfdHJhaW5fZGF0YSRpbnRfcmF0ZSAtIG1lYW4oc2FtcGxlZF90cmFpbl9kYXRhJGludF9yYXRlKSleMikpCiN0bS50ZXN0X3IyIDwtIDEgLSAoc3VtKChzYW1wbGVkX3Rlc3RfZGF0YSRpbnRfcmF0ZSAtIHRtLnRlc3RfcHJlZGljdGlvbnMpXjIpIC8gc3VtKChzYW1wbGVkX3Rlc3RfZGF0YSRpbnRfcmF0ZSAtIG1lYW4oc2FtcGxlZF90ZXN0X2RhdGEkaW50X3JhdGUpKV4yKSkKCiMgRGlzcGxheSB0aGUgbWV0cmljcwojY2F0KCJUcmFpbmluZyBNU0U6IiwgdG0udHJhaW5fbXNlLCAiXG4iKQojY2F0KCJUZXN0aW5nIE1TRToiLCB0bS50ZXN0X21zZSwgIlxuIikKI2NhdCgiVHJhaW5pbmcgUk1TRToiLCB0bS50cmFpbl9ybXNlLCAiXG4iKQojY2F0KCJUZXN0aW5nIFJNU0U6IiwgdG0udGVzdF9ybXNlLCAiXG4iKQojY2F0KCJUcmFpbmluZyBNQUU6IiwgdG0udHJhaW5fbWFlLCAiXG4iKQojY2F0KCJUZXN0aW5nIE1BRToiLCB0bS50ZXN0X21hZSwgIlxuIikKI2NhdCgiVHJhaW5pbmcgUi1zcXVhcmVkIChSwrIpOiIsIHRtLnRyYWluX3IyLCAiXG4iKQojY2F0KCJUZXN0aW5nIFItc3F1YXJlZCAoUsKyKToi
LCB0bS50ZXN0X3IyLCAiXG4iKQoKIyMjIyBSYW5kb20gRm9yZXN0ICMjIyMKCiMgVHJhaW4gYSBSYW5kb20gRm9yZXN0IG1vZGVsCnJmIDwtIHJhbmdlcihmb3JtdWxhID0gaW50X3JhdGUgfiAuLCBkYXRhID0gc2FtcGxlZF90cmFpbl9kYXRhLCBudW0udHJlZXMgPSA1MDAsIHZlcmJvc2U9VFJVRSwgaW1wb3J0YW5jZSA9ICJpbXB1cml0eSIsIG9vYi5lcnJvciA9IFRSVUUpCgojIFByaW50IHRoZSBtb2RlbCBzdW1tYXJ5CnByaW50KCJSYW5kb20gRm9yZXN0IE1vZGVsIFN1bW1hcnk6IikKcHJpbnQocmYpCgojIE1ha2UgcHJlZGljdGlvbnMgb24gdGhlIHRyYWluaW5nIGFuZCB0ZXN0aW5nIGRhdGEKcmYudHJhaW5fcHJlZGljdGlvbnMgPC0gcHJlZGljdChyZiwgZGF0YSA9IHNhbXBsZWRfdHJhaW5fZGF0YSkKcmYudGVzdF9wcmVkaWN0aW9ucyA8LSBwcmVkaWN0KHJmLCBkYXRhID0gc2FtcGxlZF90ZXN0X2RhdGEpCgojIENhbGN1bGF0ZSBNZWFuIFNxdWFyZWQgRXJyb3IgKE1TRSkgZm9yIHRyYWluaW5nIGFuZCB0ZXN0aW5nCnJmLnRyYWluX21zZSA8LSBtZWFuKChyZi50cmFpbl9wcmVkaWN0aW9ucyRwcmVkaWN0aW9ucyAtIHNhbXBsZWRfdHJhaW5fZGF0YSRpbnRfcmF0ZSleMikKcmYudGVzdF9tc2UgPC0gbWVhbigocmYudGVzdF9wcmVkaWN0aW9ucyRwcmVkaWN0aW9ucyAtIHNhbXBsZWRfdGVzdF9kYXRhJGludF9yYXRlKV4yKQoKIyBDYWxjdWxhdGUgUm9vdCBNZWFuIFNxdWFyZWQgRXJyb3IgKFJNU0UpIGZvciB0cmFpbmluZyBhbmQgdGVzdGluZwpyZi50cmFpbl9ybXNlIDwtIHNxcnQocmYudHJhaW5fbXNlKQpyZi50ZXN0X3Jtc2UgPC0gc3FydChyZi50ZXN0X21zZSkKCiMgQ2FsY3VsYXRlIE1lYW4gQWJzb2x1dGUgRXJyb3IgKE1BRSkgZm9yIHRyYWluaW5nIGFuZCB0ZXN0aW5nCnJmLnRyYWluX21hZSA8LSBtZWFuKGFicyhyZi50cmFpbl9wcmVkaWN0aW9ucyRwcmVkaWN0aW9ucyAtIHNhbXBsZWRfdHJhaW5fZGF0YSRpbnRfcmF0ZSkpCnJmLnRlc3RfbWFlIDwtIG1lYW4oYWJzKHJmLnRlc3RfcHJlZGljdGlvbnMkcHJlZGljdGlvbnMgLSBzYW1wbGVkX3Rlc3RfZGF0YSRpbnRfcmF0ZSkpCgojIENhbGN1bGF0ZSBSLXNxdWFyZWQgKFLCsikgZm9yIHRyYWluaW5nIGFuZCB0ZXN0aW5nCnJmLnRyYWluX3IyIDwtIDEgLSAoc3VtKChzYW1wbGVkX3RyYWluX2RhdGEkaW50X3JhdGUgLSByZi50cmFpbl9wcmVkaWN0aW9ucyRwcmVkaWN0aW9ucyleMikgLyBzdW0oKHNhbXBsZWRfdHJhaW5fZGF0YSRpbnRfcmF0ZSAtIG1lYW4oc2FtcGxlZF90cmFpbl9kYXRhJGludF9yYXRlKSleMikpCnJmLnRlc3RfcjIgPC0gMSAtIChzdW0oKHNhbXBsZWRfdGVzdF9kYXRhJGludF9yYXRlIC0gcmYudGVzdF9wcmVkaWN0aW9ucyRwcmVkaWN0aW9ucyleMikgLyBzdW0oKHNhbXBsZWRfdGVzdF9kYXRhJGludF9yYXRlIC0gbWVhbihzYW1wbGVkX3Rlc3RfZGF0YSRpbnRfcmF0ZSkpXjIpKQoKIyBEaXNwbGF5IHRoZSBtZXRyaWNzCmNhdCgiVHJh
aW5pbmcgTVNFOiIsIHJmLnRyYWluX21zZSwgIlxuIikKY2F0KCJUZXN0aW5nIE1TRToiLCByZi50ZXN0X21zZSwgIlxuIikKY2F0KCJUcmFpbmluZyBSTVNFOiIsIHJmLnRyYWluX3Jtc2UsICJcbiIpCmNhdCgiVGVzdGluZyBSTVNFOiIsIHJmLnRlc3Rfcm1zZSwgIlxuIikKY2F0KCJUcmFpbmluZyBNQUU6IiwgcmYudHJhaW5fbWFlLCAiXG4iKQpjYXQoIlRlc3RpbmcgTUFFOiIsIHJmLnRlc3RfbWFlLCAiXG4iKQpjYXQoIlRyYWluaW5nIFItc3F1YXJlZCAoUsKyKToiLCByZi50cmFpbl9yMiwgIlxuIikKY2F0KCJUZXN0aW5nIFItc3F1YXJlZCAoUsKyKToiLCByZi50ZXN0X3IyLCAiXG4iKQojcmYgPC0gcmFuZG9tRm9yZXN0KGludF9yYXRlfi4sIGRhdGE9dHJhaW5fZGF0YSwgbnRyZWUgPSA1LCBtdHJ5ID0gMykKI2JhZy5ib3N0b249cmFuZG9tRm9yZXN0KG1lZHZ+LixkYXRhPUJvc3RvbixzdWJzZXQ9dHJhaW4sIG10cnk9MTMsaW1wb3J0YW5jZSA9VFJVRSkKI3ByaW50KHJmKQoKIyBTZXQgdGhlIG51bWJlciBvZiBjb3JlcyB5b3Ugd2FudCB0byB1c2UKI251bV9jb3JlcyA8LSA2ICAjIEFkanVzdCB0aGlzIG51bWJlciBiYXNlZCBvbiB5b3VyIHN5c3RlbSdzIGNhcGFiaWxpdGllcwoKIyBSZWdpc3RlciBwYXJhbGxlbCBiYWNrZW5kCiNjbCA8LSBtYWtlQ2x1c3RlcihudW1fY29yZXMpCiNyZWdpc3RlckRvUGFyYWxsZWwoY2wpCgojIEFzc3VtaW5nICdsY19kYXRhJyBpcyB5b3VyIGRhdGFzZXQKI3JmX21vZGVsIDwtIGZvcmVhY2gobnRyZWUgPSByZXAoMTAwLCBudW1fY29yZXMpLCAucGFja2FnZXMgPSAncmFuZG9tRm9yZXN0JykgJWRvcGFyJSB7CiMgICAgcmFuZG9tRm9yZXN0KGludF9yYXRlIH4gLiwgZGF0YSA9IGxjX2RhdGEsIG50cmVlID0gbnRyZWUsIG10cnkgPSBzcXJ0KG5jb2wobGNfZGF0YSkpKQojfQoKIyBBZnRlciB0cmFpbmluZywgc3RvcCB0aGUgY2x1c3RlciB0byByZWxlYXNlIHRoZSBjb3JlczoKI3N0b3BDbHVzdGVyKGNsKQoKIyMjIyBCb29zdGluZyAjIyMjCgojIERlZmluZSB0aGUgdGFyZ2V0IHZhcmlhYmxlIGZvciB0cmFpbmluZyBhbmQgdGVzdGluZwp4Z2IueV90cmFpbiA8LSBzYW1wbGVkX3RyYWluX2RhdGEkaW50X3JhdGUKeGdiLnlfdGVzdCA8LSBzYW1wbGVkX3Rlc3RfZGF0YSRpbnRfcmF0ZSAgIyBVc2Ugc2FtcGxlZF90ZXN0X2RhdGEgZm9yIHRlc3RpbmcKCiMgRGVmaW5lIHRoZSBmZWF0dXJlIG1hdHJpeCBmb3IgdHJhaW5pbmcgYW5kIHRlc3RpbmcgKGV4Y2x1ZGUgdGhlIHRhcmdldCB2YXJpYWJsZSkKeGdiLlhfdHJhaW4gPC0gc2FtcGxlZF90cmFpbl9kYXRhWywgLXdoaWNoKG5hbWVzKHNhbXBsZWRfdHJhaW5fZGF0YSkgPT0gJ2ludF9yYXRlJyldCnhnYi5YX3Rlc3QgPC0gc2FtcGxlZF90ZXN0X2RhdGFbLCAtd2hpY2gobmFtZXMoc2FtcGxlZF90ZXN0X2RhdGEpID09ICdpbnRfcmF0ZScpXSAgIyBVc2Ugc2FtcGxlZF90ZXN0X2RhdGEgZm9yIHRlc3RpbmcKCiMgRml0IGEgZ3JhZGllbnQg
Ym9vc3RpbmcgcmVncmVzc2lvbiBtb2RlbCB1c2luZyB4Z2Jvb3N0CnhnYiA8LSB4Z2Jvb3N0KAogIGRhdGEgPSBhcy5tYXRyaXgoeGdiLlhfdHJhaW4pLAogIGxhYmVsID0geGdiLnlfdHJhaW4sCiAgbnJvdW5kcyA9IDEwMCwKICB2ZXJib3NlID0gMAopCgojIE1ha2UgcHJlZGljdGlvbnMgb24gdGhlIHRyYWluaW5nIGFuZCB0ZXN0aW5nIGRhdGEKeGdiLnRyYWluX3ByZWRpY3Rpb25zIDwtIHByZWRpY3QoeGdiLCBuZXdkYXRhID0gYXMubWF0cml4KHhnYi5YX3RyYWluKSkKeGdiLnRlc3RfcHJlZGljdGlvbnMgPC0gcHJlZGljdCh4Z2IsIG5ld2RhdGEgPSBhcy5tYXRyaXgoeGdiLlhfdGVzdCkpCgojIENhbGN1bGF0ZSBNZWFuIFNxdWFyZWQgRXJyb3IgKE1TRSkgZm9yIHRyYWluaW5nIGFuZCB0ZXN0aW5nCnhnYi50cmFpbl9tc2UgPC0gbWVhbigoeGdiLnRyYWluX3ByZWRpY3Rpb25zIC0geGdiLnlfdHJhaW4pXjIpCnhnYi50ZXN0X21zZSA8LSBtZWFuKCh4Z2IudGVzdF9wcmVkaWN0aW9ucyAtIHhnYi55X3Rlc3QpXjIpCgojIENhbGN1bGF0ZSBSb290IE1lYW4gU3F1YXJlZCBFcnJvciAoUk1TRSkgZm9yIHRyYWluaW5nIGFuZCB0ZXN0aW5nCnhnYi50cmFpbl9ybXNlIDwtIHNxcnQoeGdiLnRyYWluX21zZSkKeGdiLnRlc3Rfcm1zZSA8LSBzcXJ0KHhnYi50ZXN0X21zZSkKCiMgQ2FsY3VsYXRlIE1lYW4gQWJzb2x1dGUgRXJyb3IgKE1BRSkgZm9yIHRyYWluaW5nIGFuZCB0ZXN0aW5nCnhnYi50cmFpbl9tYWUgPC0gbWVhbihhYnMoeGdiLnRyYWluX3ByZWRpY3Rpb25zIC0geGdiLnlfdHJhaW4pKQp4Z2IudGVzdF9tYWUgPC0gbWVhbihhYnMoeGdiLnRlc3RfcHJlZGljdGlvbnMgLSB4Z2IueV90ZXN0KSkKCiMgQ2FsY3VsYXRlIFItc3F1YXJlZCAoUsKyKSBmb3IgdHJhaW5pbmcgYW5kIHRlc3RpbmcKeGdiLnRyYWluX3IyIDwtIDEgLSAoc3VtKCh4Z2IueV90cmFpbiAtIHhnYi50cmFpbl9wcmVkaWN0aW9ucyleMikgLyBzdW0oKHhnYi55X3RyYWluIC0gbWVhbih4Z2IueV90cmFpbikpXjIpKQp4Z2IudGVzdF9yMiA8LSAxIC0gKHN1bSgoeGdiLnlfdGVzdCAtIHhnYi50ZXN0X3ByZWRpY3Rpb25zKV4yKSAvIHN1bSgoeGdiLnlfdGVzdCAtIG1lYW4oeGdiLnlfdGVzdCkpXjIpKQoKIyBEaXNwbGF5IHRoZSBtZXRyaWNzCmNhdCgiVHJhaW5pbmcgTVNFOiIsIHhnYi50cmFpbl9tc2UsICJcbiIpCmNhdCgiVGVzdGluZyBNU0U6IiwgeGdiLnRlc3RfbXNlLCAiXG4iKQpjYXQoIlRyYWluaW5nIFJNU0U6IiwgeGdiLnRyYWluX3Jtc2UsICJcbiIpCmNhdCgiVGVzdGluZyBSTVNFOiIsIHhnYi50ZXN0X3Jtc2UsICJcbiIpCmNhdCgiVHJhaW5pbmcgTUFFOiIsIHhnYi50cmFpbl9tYWUsICJcbiIpCmNhdCgiVGVzdGluZyBNQUU6IiwgeGdiLnRlc3RfbWFlLCAiXG4iKQpjYXQoIlRyYWluaW5nIFItc3F1YXJlZCAoUsKyKToiLCB4Z2IudHJhaW5fcjIsICJcbiIpCmNhdCgiVGVzdGluZyBSLXNxdWFyZWQgKFLCsik6IiwgeGdiLnRlc3RfcjIsICJc
biIpCmBgYApGb2xsb3dpbmcsIGEgc2NhdHRlciBwbG90IG9mIGFjdHVhbCB2cyBwcmVkaWN0ZWQgdHJhaW5pbmcgdmFsdWVzIGZvciBlYWNoIG1vZGVsIGlzIHBsb3QuClRoaXMgcGxvdCBoZWxwcyB1cyB2aXN1YWxpemUgaG93IHdlbGwgZWFjaCBtb2RlbCdzIHByZWRpY3Rpb25zIGFsaWduIHdpdGggdGhlIGFjdHVhbCBkYXRhIHBvaW50cy4KYGBge3J9CiMgQ3JlYXRlIGEgc2NhdHRlciBwbG90IGZ1bmN0aW9uCmNyZWF0ZV9zY2F0dGVyX3Bsb3QgPC0gZnVuY3Rpb24oYWN0dWFsX3ZhbHVlcywgcHJlZGljdGVkX3ZhbHVlcywgbW9kZWxfbmFtZSkgewogIG1vZGVsX2NvbXBhcmlzb25fZGF0YSA8LSBkYXRhLmZyYW1lKAogICAgQWN0dWFsID0gYWN0dWFsX3ZhbHVlcywKICAgIFByZWRpY3RlZCA9IHByZWRpY3RlZF92YWx1ZXMKICApCiAgCiAgc2NhdHRlcl9wbG90IDwtIGdncGxvdChtb2RlbF9jb21wYXJpc29uX2RhdGEsIGFlcyh4ID0gQWN0dWFsLCB5ID0gUHJlZGljdGVkKSkgKwogICAgZ2VvbV9wb2ludCgpICsKICAgIGdlb21fYWJsaW5lKGludGVyY2VwdCA9IDAsIHNsb3BlID0gMSwgbGluZXR5cGUgPSAiZGFzaGVkIiwgY29sb3IgPSAicmVkIikgKyAgIyBBZGQgYSBkaWFnb25hbCByZWZlcmVuY2UgbGluZQogICAgbGFicyh4ID0gIkFjdHVhbCBUcmFpbmluZyBWYWx1ZXMiLCB5ID0gIlByZWRpY3RlZCBUcmFpbmluZyBWYWx1ZXMiLCB0aXRsZSA9IG1vZGVsX25hbWUpICsKICAgIHRoZW1lX21pbmltYWwoKSArCiAgICB5bGltKC01MCwgNTApCiAgCiAgcmV0dXJuKHNjYXR0ZXJfcGxvdCkKfQoKIyBDcmVhdGUgc2NhdHRlciBwbG90cyBmb3IgZWFjaCBtb2RlbApsbV9zY2F0dGVyX3Bsb3QgPC0gY3JlYXRlX3NjYXR0ZXJfcGxvdCgKICBhY3R1YWxfdmFsdWVzID0gc2FtcGxlZF90cmFpbl9kYXRhJGludF9yYXRlLAogIHByZWRpY3RlZF92YWx1ZXMgPSBsbS50cmFpbl9wcmVkaWN0aW9ucywKICBtb2RlbF9uYW1lID0gIkxpbmVhciBSZWdyZXNzaW9uIgopCgpyZl9zY2F0dGVyX3Bsb3QgPC0gY3JlYXRlX3NjYXR0ZXJfcGxvdCgKICBhY3R1YWxfdmFsdWVzID0gc2FtcGxlZF90cmFpbl9kYXRhJGludF9yYXRlLAogIHByZWRpY3RlZF92YWx1ZXMgPSByZi50cmFpbl9wcmVkaWN0aW9ucyRwcmVkaWN0aW9ucywKICBtb2RlbF9uYW1lID0gIlJhbmRvbSBGb3Jlc3QiCikKCnhnYl9zY2F0dGVyX3Bsb3QgPC0gY3JlYXRlX3NjYXR0ZXJfcGxvdCgKICBhY3R1YWxfdmFsdWVzID0geGdiLnlfdHJhaW4sCiAgcHJlZGljdGVkX3ZhbHVlcyA9IHhnYi50cmFpbl9wcmVkaWN0aW9ucywKICBtb2RlbF9uYW1lID0gIlhHQm9vc3QiCikKCiMgRGlzcGxheSB0aGUgc2NhdHRlciBwbG90cyBzZXBhcmF0ZWx5CnByaW50KGxtX3NjYXR0ZXJfcGxvdCkKcHJpbnQocmZfc2NhdHRlcl9wbG90KQpwcmludCh4Z2Jfc2NhdHRlcl9wbG90KQpgYGAKRm9sbG93aW5nLCBhIHNjYXR0ZXIgcGxvdCBvZiBhY3R1YWwgdnMgcHJlZGljdGVkIHRlc3RpbmcgdmFsdWVz
IGZvciBlYWNoIG1vZGVsIGlzIHBsb3QuClRoaXMgcGxvdCBoZWxwcyB1cyB2aXN1YWxpemUgaG93IHdlbGwgZWFjaCBtb2RlbCdzIHByZWRpY3Rpb25zIGFsaWduIHdpdGggdGhlIGFjdHVhbCBkYXRhIHBvaW50cy4KYGBge3J9CiMgQ3JlYXRlIGEgc2NhdHRlciBwbG90IGZ1bmN0aW9uCmNyZWF0ZV9zY2F0dGVyX3Bsb3QgPC0gZnVuY3Rpb24oYWN0dWFsX3ZhbHVlcywgcHJlZGljdGVkX3ZhbHVlcywgbW9kZWxfbmFtZSkgewogIG1vZGVsX2NvbXBhcmlzb25fZGF0YSA8LSBkYXRhLmZyYW1lKAogICAgQWN0dWFsID0gYWN0dWFsX3ZhbHVlcywKICAgIFByZWRpY3RlZCA9IHByZWRpY3RlZF92YWx1ZXMKICApCiAgCiAgc2NhdHRlcl9wbG90IDwtIGdncGxvdChtb2RlbF9jb21wYXJpc29uX2RhdGEsIGFlcyh4ID0gQWN0dWFsLCB5ID0gUHJlZGljdGVkKSkgKwogICAgZ2VvbV9wb2ludCgpICsKICAgIGdlb21fYWJsaW5lKGludGVyY2VwdCA9IDAsIHNsb3BlID0gMSwgbGluZXR5cGUgPSAiZGFzaGVkIiwgY29sb3IgPSAicmVkIikgKyAgIyBBZGQgYSBkaWFnb25hbCByZWZlcmVuY2UgbGluZQogICAgbGFicyh4ID0gIkFjdHVhbCBUZXN0aW5nIFZhbHVlcyIsIHkgPSAiUHJlZGljdGVkIFRlc3RpbmcgVmFsdWVzIiwgdGl0bGUgPSBtb2RlbF9uYW1lKSArCiAgICB0aGVtZV9taW5pbWFsKCkgKwogICAgeWxpbSgtNTAsIDUwKSArCiAgICB4bGltKDAsIDQwKQogIAogIHJldHVybihzY2F0dGVyX3Bsb3QpCn0KCiMgQ3JlYXRlIHNjYXR0ZXIgcGxvdHMgZm9yIGVhY2ggbW9kZWwKbG1fc2NhdHRlcl9wbG90IDwtIGNyZWF0ZV9zY2F0dGVyX3Bsb3QoCiAgYWN0dWFsX3ZhbHVlcyA9IHNhbXBsZWRfdGVzdF9kYXRhJGludF9yYXRlLAogIHByZWRpY3RlZF92YWx1ZXMgPSBsbS50ZXN0X3ByZWRpY3Rpb25zLAogIG1vZGVsX25hbWUgPSAiTGluZWFyIFJlZ3Jlc3Npb24iCikKCnJmX3NjYXR0ZXJfcGxvdCA8LSBjcmVhdGVfc2NhdHRlcl9wbG90KAogIGFjdHVhbF92YWx1ZXMgPSBzYW1wbGVkX3Rlc3RfZGF0YSRpbnRfcmF0ZSwKICBwcmVkaWN0ZWRfdmFsdWVzID0gcmYudGVzdF9wcmVkaWN0aW9ucyRwcmVkaWN0aW9ucywKICBtb2RlbF9uYW1lID0gIlJhbmRvbSBGb3Jlc3QiCikKCnhnYl9zY2F0dGVyX3Bsb3QgPC0gY3JlYXRlX3NjYXR0ZXJfcGxvdCgKICBhY3R1YWxfdmFsdWVzID0geGdiLnlfdGVzdCwKICBwcmVkaWN0ZWRfdmFsdWVzID0geGdiLnRlc3RfcHJlZGljdGlvbnMsCiAgbW9kZWxfbmFtZSA9ICJYR0Jvb3N0IgopCgojIERpc3BsYXkgdGhlIHNjYXR0ZXIgcGxvdHMgc2VwYXJhdGVseQpwcmludChsbV9zY2F0dGVyX3Bsb3QpCnByaW50KHJmX3NjYXR0ZXJfcGxvdCkKcHJpbnQoeGdiX3NjYXR0ZXJfcGxvdCkKYGBgCgpSZXNpZHVhbCBwbG90cyBjYW4gaGVscCBpZGVudGlmeSBwYXR0ZXJucyBpbiBwcmVkaWN0aW9uIGVycm9ycyBhbmQgYXNzZXNzIHdoZXRoZXIgdGhlIGFzc3VtcHRpb25zIG9mIGxpbmVhciByZWdyZXNzaW9uIChpZiBh
cHBsaWNhYmxlKSBhcmUgbWV0LgpgYGB7cn0KIyBDcmVhdGUgYSByZXNpZHVhbCBwbG90IGZ1bmN0aW9uCmNyZWF0ZV9yZXNpZHVhbF9wbG90IDwtIGZ1bmN0aW9uKGFjdHVhbF92YWx1ZXMsIHByZWRpY3RlZF92YWx1ZXMsIG1vZGVsX25hbWUpIHsKICByZXNpZHVhbHMgPC0gYWN0dWFsX3ZhbHVlcyAtIHByZWRpY3RlZF92YWx1ZXMKICByZXNpZHVhbF9kYXRhIDwtIGRhdGEuZnJhbWUoCiAgICBQcmVkaWN0ZWQgPSBwcmVkaWN0ZWRfdmFsdWVzLAogICAgUmVzaWR1YWxzID0gcmVzaWR1YWxzCiAgKQogIAogIHJlc2lkdWFsX3Bsb3QgPC0gZ2dwbG90KHJlc2lkdWFsX2RhdGEsIGFlcyh4ID0gUHJlZGljdGVkLCB5ID0gUmVzaWR1YWxzKSkgKwogICAgZ2VvbV9wb2ludCgpICsKICAgIGdlb21faGxpbmUoeWludGVyY2VwdCA9IDAsIGxpbmV0eXBlID0gImRhc2hlZCIsIGNvbG9yID0gInJlZCIpICsgICMgUmVkIGhvcml6b250YWwgcmVmZXJlbmNlIGxpbmUKICAgIGxhYnMoeCA9ICJQcmVkaWN0ZWQgVmFsdWVzIiwgeSA9ICJSZXNpZHVhbHMiLCB0aXRsZSA9IHBhc3RlKCJSZXNpZHVhbCBQbG90IC0iLCBtb2RlbF9uYW1lKSkgKwogICAgdGhlbWVfbWluaW1hbCgpICsKICAgIHlsaW0oLTMwLCAzMCkgKwogICAgeGxpbSgwLCA0MCkKICAKICByZXR1cm4ocmVzaWR1YWxfcGxvdCkKfQoKIyBDcmVhdGUgcmVzaWR1YWwgcGxvdHMgZm9yIGVhY2ggbW9kZWwKbG1fcmVzaWR1YWxfcGxvdCA8LSBjcmVhdGVfcmVzaWR1YWxfcGxvdCgKICBhY3R1YWxfdmFsdWVzID0gc2FtcGxlZF90cmFpbl9kYXRhJGludF9yYXRlLAogIHByZWRpY3RlZF92YWx1ZXMgPSBsbS50cmFpbl9wcmVkaWN0aW9ucywKICBtb2RlbF9uYW1lID0gIkxpbmVhciBSZWdyZXNzaW9uIgopCgpyZl9yZXNpZHVhbF9wbG90IDwtIGNyZWF0ZV9yZXNpZHVhbF9wbG90KAogIGFjdHVhbF92YWx1ZXMgPSBzYW1wbGVkX3RyYWluX2RhdGEkaW50X3JhdGUsCiAgcHJlZGljdGVkX3ZhbHVlcyA9IHJmLnRyYWluX3ByZWRpY3Rpb25zJHByZWRpY3Rpb25zLAogIG1vZGVsX25hbWUgPSAiUmFuZG9tIEZvcmVzdCIKKQoKeGdiX3Jlc2lkdWFsX3Bsb3QgPC0gY3JlYXRlX3Jlc2lkdWFsX3Bsb3QoCiAgYWN0dWFsX3ZhbHVlcyA9IHhnYi55X3RyYWluLAogIHByZWRpY3RlZF92YWx1ZXMgPSB4Z2IudHJhaW5fcHJlZGljdGlvbnMsCiAgbW9kZWxfbmFtZSA9ICJYR0Jvb3N0IgopCgojIERpc3BsYXkgdGhlIHJlc2lkdWFsIHBsb3RzIHNlcGFyYXRlbHkKcHJpbnQobG1fcmVzaWR1YWxfcGxvdCkKcHJpbnQocmZfcmVzaWR1YWxfcGxvdCkKcHJpbnQoeGdiX3Jlc2lkdWFsX3Bsb3QpCmBgYApGcm9tIHRoZSBwbG90cyBhYm92ZSB3ZSBjYW4gY2xlYXJseSBzZWUgdGhhdDoKCi0gICBMaW5lYXIgUmVncmVzc2lvbiBSZXNpZHVhbCBQbG90OgogICAgLSAgIFBhdHRlcm46IFRoZXJlIGFwcGVhcnMgdG8gYmUgYSBjbGVhciBwYXR0ZXJuIGluIHRoZSByZXNpZHVhbHMsIHdpdGggYSBmdW5uZWwgc2hhcGUgdGhh
dCB3aWRlbnMgYXMgdGhlIHByZWRpY3RlZCB2YWx1ZXMgaW5jcmVhc2UuIFRoaXMgc3VnZ2VzdHMgaGV0ZXJvc2NlZGFzdGljaXR5LCB3aGVyZSB0aGUgdmFyaWFuY2Ugb2YgdGhlIHJlc2lkdWFscyBpcyBub3QgY29uc3RhbnQgYWNyb3NzIHRoZSByYW5nZSBvZiBwcmVkaWN0ZWQgdmFsdWVzLgogICAgLSAgIE91dGxpZXJzOiBUaGVyZSBhcmUgc2V2ZXJhbCBwcm9taW5lbnQgb3V0bGllcnMsIHBhcnRpY3VsYXJseSBmb3IgaGlnaGVyIHByZWRpY3RlZCB2YWx1ZXMuIFRoZXNlIHBvaW50cyBzaWduaWZpY2FudGx5IGRldmlhdGUgZnJvbSB0aGUgcmVkIGRhc2hlZCBsaW5lLCB3aGljaCByZXByZXNlbnRzIHplcm8gcmVzaWR1YWxzLgotICAgUmFuZG9tIEZvcmVzdCBSZXNpZHVhbCBQbG90OgogICAgLSAgIFBhdHRlcm46IFRoZSByZXNpZHVhbHMgc2VlbSB0byBiZSByYW5kb21seSBkaXNwZXJzZWQgYXJvdW5kIHRoZSB6ZXJvIGxpbmUgYXQgbG93ZXIgcHJlZGljdGVkIHZhbHVlcywgd2hpY2ggaXMgYSBnb29kIHNpZ24uIEhvd2V2ZXIsIGFzIHByZWRpY3RlZCB2YWx1ZXMgaW5jcmVhc2UsIHRoZSByZXNpZHVhbHMgYWxzbyBpbmNyZWFzZSwgc3VnZ2VzdGluZyBhIHN5c3RlbWF0aWMgZXJyb3IgaW4gdGhlIG1vZGVsIHByZWRpY3Rpb25zLgogICAgLSAgIENvbmNlbnRyYXRpb246IFRoZXJlIGlzIGEgaGlnaGVyIGNvbmNlbnRyYXRpb24gb2YgcmVzaWR1YWxzIGFyb3VuZCB0aGUgemVybyBsaW5lIGNvbXBhcmVkIHRvIHRoZSBMaW5lYXIgUmVncmVzc2lvbiBtb2RlbCwgd2hpY2ggY291bGQgaW5kaWNhdGUgYSBiZXR0ZXIgZml0Ci0gICAgWEdCb29zdCBSZXNpZHVhbCBQbG90OgogICAgLSAgIFBhdHRlcm46IFRoZSByZXNpZHVhbHMgaW4gdGhpcyBwbG90IGFyZSBtb3JlIGV2ZW5seSBkaXNwZXJzZWQgYWNyb3NzIHRoZSBwcmVkaWN0ZWQgdmFsdWVzIHRoYW4gaW4gdGhlIExpbmVhciBSZWdyZXNzaW9uIHBsb3QsIHN1Z2dlc3RpbmcgYSBtb3JlIGNvbnNpc3RlbnQgdmFyaWFuY2UgKGhvbW9zY2VkYXN0aWNpdHkpIGFuZCBwb3RlbnRpYWxseSBhIGJldHRlciBmaXQuCiAgICAtICAgT3V0bGllcnM6IFRoaXMgcGxvdCBhbHNvIHNob3dzIG91dGxpZXJzLCBidXQgdGhleSBkbyBub3QgYXBwZWFyIGFzIGV4dHJlbWUgYXMgaW4gdGhlIExpbmVhciBSZWdyZXNzaW9uIHBsb3QuIFRoZSBzcHJlYWQgb2YgcmVzaWR1YWxzIGlzIG5hcnJvd2VyIGNvbXBhcmVkIHRvIHRoZSBSYW5kb20gRm9yZXN0IHBsb3QuCi0gICBDb21wYXJpc29uOgogICAgLSAgIEhldGVyb3NjZWRhc3RpY2l0eTogVGhlIExpbmVhciBSZWdyZXNzaW9uIG1vZGVsIGV4aGliaXRzIGNsZWFyIGhldGVyb3NjZWRhc3RpY2l0eSwgd2hpY2ggaXMgYSBzaWduIG9mIG1vZGVsIGluYWRlcXVhY3kuIFRoaXMgY291bGQgYmUgaW1wcm92ZWQgd2l0aCB0cmFuc2Zvcm1hdGlvbnMgb3IgdXNpbmcgbW9kZWxzIHRoYXQgaGFuZGxlIG5vbi1jb25zdGFudCB2YXJpYW5jZSBiZXR0ZXIuCiAgICAt
ICAgTW9kZWwgRml0OiBUaGUgUmFuZG9tIEZvcmVzdCBtb2RlbCBzZWVtcyB0byBmaXQgdGhlIGxvd2VyIHJhbmdlIG9mIHByZWRpY3RlZCB2YWx1ZXMgd2VsbCBidXQgc2hvd3MgaW5jcmVhc2luZyByZXNpZHVhbHMgd2l0aCBoaWdoZXIgcHJlZGljdGVkIHZhbHVlcywgd2hpY2ggY291bGQgaW5kaWNhdGUgb3ZlcmZpdHRpbmcgb3IgYSBsYWNrIG9mIGdlbmVyYWxpemF0aW9uIGZvciBoaWdoZXIgdmFsdWVzLgogICAgLSAgIENvbnNpc3RlbmN5OiBUaGUgWEdCb29zdCBtb2RlbCBzZWVtcyB0byBzaG93IGEgbW9yZSBjb25zaXN0ZW50IHNwcmVhZCBvZiByZXNpZHVhbHMgYXJvdW5kIHRoZSB6ZXJvIGxpbmUsIHdoaWNoIGlzIGluZGljYXRpdmUgb2YgYSBtb2RlbCB0aGF0IGhhcyBhIGNvbnNpc3RlbnQgcGVyZm9ybWFuY2UgYWNyb3NzIHRoZSByYW5nZSBvZiBwcmVkaWN0ZWQgdmFsdWVzLgogICAgLSAgIE91dGxpZXJzOiBBbGwgdGhyZWUgbW9kZWxzIGhhdmUgb3V0bGllcnMsIGJ1dCB0aGVpciBpbXBhY3Qgc2VlbXMgbW9zdCBwcm9ub3VuY2VkIGluIHRoZSBMaW5lYXIgUmVncmVzc2lvbiBtb2RlbC4KClRoaXMgdmlzdWFsaXphdGlvbiBjYW4gaGVscCB5b3UgY29tcGFyZSB0aGUgZGlzdHJpYnV0aW9uIG9mIHByZWRpY3Rpb24gZXJyb3JzIGFjcm9zcyBtb2RlbHMuCmBgYHtyfQojIENyZWF0ZSBhIGRlbnNpdHkgcGxvdCBmdW5jdGlvbiBmb3IgcmVzaWR1YWxzCmNyZWF0ZV9yZXNpZHVhbF9kZW5zaXR5X3Bsb3QgPC0gZnVuY3Rpb24oYWN0dWFsX3ZhbHVlcywgcHJlZGljdGVkX3ZhbHVlcywgbW9kZWxfbmFtZSkgewogIHJlc2lkdWFscyA8LSBhY3R1YWxfdmFsdWVzIC0gcHJlZGljdGVkX3ZhbHVlcwogIHJlc2lkdWFsX2RhdGEgPC0gZGF0YS5mcmFtZShSZXNpZHVhbHMgPSByZXNpZHVhbHMpCiAgCiAgZGVuc2l0eV9wbG90IDwtIGdncGxvdChyZXNpZHVhbF9kYXRhLCBhZXMoeCA9IFJlc2lkdWFscykpICsKICAgIGdlb21fZGVuc2l0eShmaWxsID0gInNreWJsdWUiLCBjb2xvciA9ICJibGFjayIsIGFscGhhID0gMC43KSArCiAgICBsYWJzKHggPSAiUmVzaWR1YWxzIiwgeSA9ICJEZW5zaXR5IiwgdGl0bGUgPSBwYXN0ZSgiUmVzaWR1YWwgRGVuc2l0eSBQbG90IC0iLCBtb2RlbF9uYW1lKSkgKwogICAgdGhlbWVfbWluaW1hbCgpCiAgCiAgcmV0dXJuKGRlbnNpdHlfcGxvdCkKfQoKIyBDcmVhdGUgZGVuc2l0eSBwbG90cyBmb3IgcmVzaWR1YWxzIGZvciBlYWNoIG1vZGVsCmxtX3Jlc2lkdWFsX2RlbnNpdHlfcGxvdCA8LSBjcmVhdGVfcmVzaWR1YWxfZGVuc2l0eV9wbG90KAogIGFjdHVhbF92YWx1ZXMgPSBzYW1wbGVkX3RyYWluX2RhdGEkaW50X3JhdGUsCiAgcHJlZGljdGVkX3ZhbHVlcyA9IGxtLnRyYWluX3ByZWRpY3Rpb25zLAogIG1vZGVsX25hbWUgPSAiTGluZWFyIFJlZ3Jlc3Npb24iCikKCnJmX3Jlc2lkdWFsX2RlbnNpdHlfcGxvdCA8LSBjcmVhdGVfcmVzaWR1YWxfZGVuc2l0eV9wbG90KAogIGFjdHVhbF92YWx1ZXMgPSBz
YW1wbGVkX3RyYWluX2RhdGEkaW50X3JhdGUsCiAgcHJlZGljdGVkX3ZhbHVlcyA9IHJmLnRyYWluX3ByZWRpY3Rpb25zJHByZWRpY3Rpb25zLAogIG1vZGVsX25hbWUgPSAiUmFuZG9tIEZvcmVzdCIKKQoKeGdiX3Jlc2lkdWFsX2RlbnNpdHlfcGxvdCA8LSBjcmVhdGVfcmVzaWR1YWxfZGVuc2l0eV9wbG90KAogIGFjdHVhbF92YWx1ZXMgPSB4Z2IueV90cmFpbiwKICBwcmVkaWN0ZWRfdmFsdWVzID0geGdiLnRyYWluX3ByZWRpY3Rpb25zLAogIG1vZGVsX25hbWUgPSAiWEdCb29zdCIKKQoKIyBEaXNwbGF5IHRoZSBkZW5zaXR5IHBsb3RzIHNlcGFyYXRlbHkKcHJpbnQobG1fcmVzaWR1YWxfZGVuc2l0eV9wbG90KQpwcmludChyZl9yZXNpZHVhbF9kZW5zaXR5X3Bsb3QpCnByaW50KHhnYl9yZXNpZHVhbF9kZW5zaXR5X3Bsb3QpCmBgYAoKVGhpcyB2aXN1YWxpemF0aW9uIGNhbiBoZWxwIHlvdSBjb21wYXJlIHRoZSBkaXN0cmlidXRpb24gb2YgcHJlZGljdGlvbiBlcnJvcnMgYWNyb3NzIG1vZGVscyB0aHJvdWdoIGhpc3RvZ3JhbXMuCgpgYGB7cn0KIyBDcmVhdGUgYSBoaXN0b2dyYW0gcGxvdCBmdW5jdGlvbiBmb3IgcmVzaWR1YWxzIHdpdGggYSByZWQgZGVuc2l0eSBjdXJ2ZQpjcmVhdGVfcmVzaWR1YWxfaGlzdG9ncmFtX3Bsb3QgPC0gZnVuY3Rpb24oYWN0dWFsX3ZhbHVlcywgcHJlZGljdGVkX3ZhbHVlcywgbW9kZWxfbmFtZSkgewogIHJlc2lkdWFscyA8LSBhY3R1YWxfdmFsdWVzIC0gcHJlZGljdGVkX3ZhbHVlcwogIHJlc2lkdWFsX2RhdGEgPC0gZGF0YS5mcmFtZShSZXNpZHVhbHMgPSByZXNpZHVhbHMpCiAgCiAgaGlzdG9ncmFtX3Bsb3QgPC0gZ2dwbG90KHJlc2lkdWFsX2RhdGEsIGFlcyh4ID0gUmVzaWR1YWxzKSkgKwogICAgZ2VvbV9oaXN0b2dyYW0oYWVzKHkgPSBhZnRlcl9zdGF0KGRlbnNpdHkpKSwgYmlucyA9IDMwLCBmaWxsID0gInNreWJsdWUiLCBjb2xvciA9ICJibGFjayIsIGFscGhhID0gMC43KSArICAjIFVzZSBkZW5zaXR5IG9uIHRoZSB5LWF4aXMgZm9yIHRoZSBoaXN0b2dyYW0KICAgIGdlb21fZGVuc2l0eShjb2xvciA9ICJyZWQiLCBsaW5ld2lkdGggPSAxLjUpICsgICMgQWRkIHRoZSBkZW5zaXR5IHBsb3QgaW4gcmVkCiAgICBsYWJzKHggPSAiUmVzaWR1YWxzIiwgeSA9ICJEZW5zaXR5IiwgdGl0bGUgPSBwYXN0ZSgiUmVzaWR1YWwgSGlzdG9ncmFtIFBsb3Qgd2l0aCBEZW5zaXR5IEN1cnZlIC0iLCBtb2RlbF9uYW1lKSkgKwogICAgdGhlbWVfbWluaW1hbCgpICsKICAgIHhsaW0oLTIwLDIwKSArIAogICAgeWxpbSgwLCAwLjMpCiAgCiAgcmV0dXJuKGhpc3RvZ3JhbV9wbG90KQp9CgojIENyZWF0ZSBoaXN0b2dyYW0gcGxvdHMgZm9yIHJlc2lkdWFscyBmb3IgZWFjaCBtb2RlbApsbV9yZXNpZHVhbF9oaXN0b2dyYW1fcGxvdCA8LSBjcmVhdGVfcmVzaWR1YWxfaGlzdG9ncmFtX3Bsb3QoCiAgYWN0dWFsX3ZhbHVlcyA9IHNhbXBsZWRfdHJhaW5fZGF0YSRpbnRfcmF0ZSwKICBwcmVkaWN0ZWRfdmFsdWVz
ID0gbG0udHJhaW5fcHJlZGljdGlvbnMsCiAgbW9kZWxfbmFtZSA9ICJMaW5lYXIgUmVncmVzc2lvbiIKKQoKcmZfcmVzaWR1YWxfaGlzdG9ncmFtX3Bsb3QgPC0gY3JlYXRlX3Jlc2lkdWFsX2hpc3RvZ3JhbV9wbG90KAogIGFjdHVhbF92YWx1ZXMgPSBzYW1wbGVkX3RyYWluX2RhdGEkaW50X3JhdGUsCiAgcHJlZGljdGVkX3ZhbHVlcyA9IHJmLnRyYWluX3ByZWRpY3Rpb25zJHByZWRpY3Rpb25zLAogIG1vZGVsX25hbWUgPSAiUmFuZG9tIEZvcmVzdCIKKQoKeGdiX3Jlc2lkdWFsX2hpc3RvZ3JhbV9wbG90IDwtIGNyZWF0ZV9yZXNpZHVhbF9oaXN0b2dyYW1fcGxvdCgKICBhY3R1YWxfdmFsdWVzID0geGdiLnlfdHJhaW4sCiAgcHJlZGljdGVkX3ZhbHVlcyA9IHhnYi50cmFpbl9wcmVkaWN0aW9ucywKICBtb2RlbF9uYW1lID0gIlhHQm9vc3QiCikKCiMgRGlzcGxheSB0aGUgaGlzdG9ncmFtIHBsb3RzIHNlcGFyYXRlbHkKcHJpbnQobG1fcmVzaWR1YWxfaGlzdG9ncmFtX3Bsb3QpCnByaW50KHJmX3Jlc2lkdWFsX2hpc3RvZ3JhbV9wbG90KQpwcmludCh4Z2JfcmVzaWR1YWxfaGlzdG9ncmFtX3Bsb3QpCmBgYAoKRm9yIGVhY2ggbW9kZWwgYSBiYXIgY2hhcnQgdGhhdCBkaXNwbGF5cyB0aGUgUi1zcXVhcmVkIChjb2VmZmljaWVudCBvZiBkZXRlcm1pbmF0aW9uKSB2YWx1ZXMgaXMgY3JlYXRlZC4KUi1zcXVhcmVkIG1lYXN1cmVzIHRoZSBwcm9wb3J0aW9uIG9mIHZhcmlhbmNlIGluIHRoZSB0YXJnZXQgdmFyaWFibGUgZXhwbGFpbmVkIGJ5IHRoZSBtb2RlbC4gSGlnaGVyIFItc3F1YXJlZCB2YWx1ZXMgaW5kaWNhdGUgYmV0dGVyIG1vZGVsIGZpdC4KYGBge3J9CiMgQ3JlYXRlIGEgZGF0YSBmcmFtZSB3aXRoIFItc3F1YXJlZCB2YWx1ZXMgZm9yIGVhY2ggbW9kZWwKbW9kZWxfbmFtZXMgPC0gYygiTGluZWFyIFJlZ3Jlc3Npb24iLCAiUmFuZG9tIEZvcmVzdCIsICJYR0Jvb3N0IikKcl9zcXVhcmVkX3ZhbHVlcyA8LSBjKAogIGxtLnRyYWluX3IyLAogIHJmLnRyYWluX3IyLAogIHhnYi50cmFpbl9yMgopCgpyX3NxdWFyZWRfZGF0YSA8LSBkYXRhLmZyYW1lKE1vZGVsID0gZmFjdG9yKG1vZGVsX25hbWVzKSwKICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgUl9zcXVhcmVkID0gcl9zcXVhcmVkX3ZhbHVlcykKCiMgQ3JlYXRlIHRoZSBSLXNxdWFyZWQgY29tcGFyaXNvbiBiYXIgY2hhcnQKcl9zcXVhcmVkX2Jhcl9jaGFydCA8LSBnZ3Bsb3Qocl9zcXVhcmVkX2RhdGEsIGFlcyh4ID0gTW9kZWwsIHkgPSBSX3NxdWFyZWQsIGZpbGwgPSBNb2RlbCkpICsKICBnZW9tX2JhcihzdGF0ID0gImlkZW50aXR5IikgKwogIGxhYnMoeCA9ICJNb2RlbCIsIHkgPSAiUi1zcXVhcmVkIChSwrIpIiwgdGl0bGUgPSAiUi1zcXVhcmVkIENvbXBhcmlzb24iKSArCiAgdGhlbWVfbWluaW1hbCgpICsKICB0aGVtZShheGlzLnRleHQueCA9IGVsZW1lbnRfdGV4dChhbmdsZSA9IDQ1LCBoanVzdCA9IDEpKQoKIyBEaXNwbGF5IHRoZSBSLXNxdWFyZWQgY29t
cGFyaXNvbiBiYXIgY2hhcnQKcHJpbnQocl9zcXVhcmVkX2Jhcl9jaGFydCkKYGBgCkEgYmFyIGNoYXJ0IHRoYXQgY29tcGFyZXMgdGhlIE1BRSBvciBSTVNFIHZhbHVlcywgaXMgZ2VuZXJhdGVkIGZvciBlYWNoIG1vZGVsLgpUaGVzZSBtZXRyaWNzIHF1YW50aWZ5IHRoZSBhdmVyYWdlIHByZWRpY3Rpb24gZXJyb3JzIG9mIGVhY2ggbW9kZWwsIGFuZCBsb3dlciB2YWx1ZXMgYXJlIHByZWZlcnJlZC4KYGBge3J9CiMgQ3JlYXRlIGEgZGF0YSBmcmFtZSB3aXRoIE1BRSBhbmQgUk1TRSB2YWx1ZXMgZm9yIGVhY2ggbW9kZWwKbW9kZWxfbmFtZXMgPC0gYygiTGluZWFyIFJlZ3Jlc3Npb24iLCAiUmFuZG9tIEZvcmVzdCIsICJYR0Jvb3N0IiwiTGluZWFyIFJlZ3Jlc3Npb24iLCAiUmFuZG9tIEZvcmVzdCIsICJYR0Jvb3N0IikKZXJyb3JfdmFsdWVzX3RyYWluIDwtIGMoCiAgbG0udHJhaW5fbWFlLAogIHJmLnRyYWluX21hZSwKICB4Z2IudHJhaW5fbWFlLAogIGxtLnRyYWluX3Jtc2UsCiAgcmYudHJhaW5fcm1zZSwKICB4Z2IudHJhaW5fcm1zZQopCmVycm9yX3ZhbHVlc190ZXN0IDwtIGMoCiAgbG0udGVzdF9tYWUsCiAgcmYudGVzdF9tYWUsCiAgeGdiLnRlc3RfbWFlLAogIGxtLnRlc3Rfcm1zZSwKICByZi50ZXN0X3Jtc2UsCiAgeGdiLnRlc3Rfcm1zZQopCmVycm9yX3R5cGUgPC0gYygKICAiTUFFIiwgIk1BRSIsICJNQUUiLCJSTVNFIiwiUk1TRSIsIlJNU0UiCikKbW9kZWxfZXJyb3JzX3RyYWluIDwtIGRhdGEuZnJhbWUoTW9kZWwgPSBmYWN0b3IobW9kZWxfbmFtZXMsIGxldmVscyA9IGMoIkxpbmVhciBSZWdyZXNzaW9uIiwgIlJhbmRvbSBGb3Jlc3QiLCAiWEdCb29zdCIpKSwKICAgICAgICAgICAgICAgIEVycm9yID0gZXJyb3JfdmFsdWVzX3RyYWluLCBUeXBlID0gZXJyb3JfdHlwZSkKbW9kZWxfZXJyb3JzX3Rlc3QgPC0gZGF0YS5mcmFtZShNb2RlbCA9IGZhY3Rvcihtb2RlbF9uYW1lcywgbGV2ZWxzID0gYygiTGluZWFyIFJlZ3Jlc3Npb24iLCAiUmFuZG9tIEZvcmVzdCIsICJYR0Jvb3N0IikpLAogICAgICAgICAgICAgICAgRXJyb3IgPSBlcnJvcl92YWx1ZXNfdGVzdCwgVHlwZSA9IGVycm9yX3R5cGUpCiMgQ3JlYXRlIHRoZSBNQUUgb3IgUk1TRSBjb21wYXJpc29uIGJhciBjaGFydAplcnJvcl9iYXJfY2hhcnRfdHJhaW4gPC0gZ2dwbG90KG1vZGVsX2Vycm9yc190cmFpbiwgYWVzKHggPSBNb2RlbCwgeSA9IEVycm9yLCBmaWxsID0gVHlwZSkpICsKICBnZW9tX2JhcihzdGF0ID0gImlkZW50aXR5IiwgcG9zaXRpb24gPSAiZG9kZ2UiKSArCiAgbGFicyh4ID0gIk1vZGVsIiwgeSA9ICJFcnJvciBWYWx1ZSIsIHRpdGxlID0gIlRyYWluaW5nIE1BRSBhbmQgUk1TRSBDb21wYXJpc29uIikgKwogIHRoZW1lX21pbmltYWwoKSArCiAgdGhlbWUoYXhpcy50ZXh0LnggPSBlbGVtZW50X3RleHQoYW5nbGUgPSA0NSwgaGp1c3QgPSAxKSkgKyAKICB5bGltKDAsIDQpCgplcnJvcl9iYXJfY2hhcnRfdGVzdCA8LSBnZ3Bsb3QobW9kZWxf
ZXJyb3JzX3Rlc3QsIGFlcyh4ID0gTW9kZWwsIHkgPSBFcnJvciwgZmlsbCA9IFR5cGUpKSArCiAgZ2VvbV9iYXIoc3RhdCA9ICJpZGVudGl0eSIsIHBvc2l0aW9uID0gImRvZGdlIikgKwogIGxhYnMoeCA9ICJNb2RlbCIsIHkgPSAiRXJyb3IgVmFsdWUiLCB0aXRsZSA9ICJUZXN0aW5nIE1BRSBhbmQgUk1TRSBDb21wYXJpc29uIikgKwogIHRoZW1lX21pbmltYWwoKSArCiAgdGhlbWUoYXhpcy50ZXh0LnggPSBlbGVtZW50X3RleHQoYW5nbGUgPSA0NSwgaGp1c3QgPSAxKSkgKyAKICB5bGltKDAsIDQpCgojIERpc3BsYXkgdGhlIE1BRSBhbmQgUk1TRSBjb21wYXJpc29uIGJhciBjaGFydApwcmludChlcnJvcl9iYXJfY2hhcnRfdHJhaW4pCnByaW50KGVycm9yX2Jhcl9jaGFydF90ZXN0KQpgYGAKCgpgYGB7cn0KIyMjIyBSYW5kb20gRm9yZXN0IEZlYXR1cmUgSW1wb3J0YW5jZSBQbG90ICMjIyMKdjEgPC0gdmlwKHJmLCB0aXRsZSA9ICJSYW5nZXIiLCBudW1fZmVhdHVyZXMgPSAyMCkgCnBsb3QodjEpCmBgYAoKCkxlYXJuaW5nIGN1cnZlIHVzaW5nIFJNU0UgYW5kIFJeMjoKYGBge3J9CiMgVE9ETzogY2hhbmdlIHRoZSB4LWF4ZXMKIyBDcmVhdGUgYSBkYXRhIGZyYW1lIHdpdGggUk1TRSBhbmQgUi1zcXVhcmVkIHZhbHVlcyBmb3IgZWFjaCBtb2RlbCBhbmQgc2FtcGxlIHNpemUKbW9kZWxfbmFtZXMgPC0gYygiTGluZWFyIFJlZ3Jlc3Npb24iLCAiUmFuZG9tIEZvcmVzdCIsICJYR0Jvb3N0IikKc2FtcGxlX3NpemVzIDwtIHNlcSgxMCwgbnJvdyhzYW1wbGVkX3RyYWluX2RhdGEpLCBieSA9IDEwKSAgIyBBZGp1c3QgdGhlIHNhbXBsZSBzaXplcyBhcyBuZWVkZWQKCiMgQ3JlYXRlIGRhdGEgZnJhbWVzIHdpdGggUk1TRSBhbmQgUi1zcXVhcmVkIHZhbHVlcyBmb3IgZWFjaCBtb2RlbApybXNlX2RhdGEgPC0gZGF0YS5mcmFtZSgKICBNb2RlbCA9IHJlcChtb2RlbF9uYW1lcywgZWFjaCA9IGxlbmd0aChzYW1wbGVfc2l6ZXMpKSwKICBTYW1wbGVfU2l6ZSA9IHJlcChzYW1wbGVfc2l6ZXMsIHRpbWVzID0gbGVuZ3RoKG1vZGVsX25hbWVzKSksCiAgUk1TRSA9IGMoCiAgICBsbS50cmFpbl9ybXNlLCByZi50cmFpbl9ybXNlLCB4Z2IudHJhaW5fcm1zZQogICkKKQoKcl9zcXVhcmVkX2RhdGEgPC0gZGF0YS5mcmFtZSgKICBNb2RlbCA9IHJlcChtb2RlbF9uYW1lcywgZWFjaCA9IGxlbmd0aChzYW1wbGVfc2l6ZXMpKSwKICBTYW1wbGVfU2l6ZSA9IHJlcChzYW1wbGVfc2l6ZXMsIHRpbWVzID0gbGVuZ3RoKG1vZGVsX25hbWVzKSksCiAgUl9zcXVhcmVkID0gYygKICAgIGxtLnRyYWluX3IyLCByZi50cmFpbl9yMiwgeGdiLnRyYWluX3IyCiAgKQopCgojIENyZWF0ZSBSTVNFIGxlYXJuaW5nIGN1cnZlCnJtc2VfY3VydmUgPC0gZ2dwbG90KHJtc2VfZGF0YSwgYWVzKHggPSBTYW1wbGVfU2l6ZSwgeSA9IFJNU0UsIGNvbG9yID0gTW9kZWwpKSArCiAgZ2VvbV9saW5lKCkgKwogIGxhYnMoeCA9ICJTYW1wbGUgU2l6ZSIsIHkgPSAiUk1TRSIsIHRp
dGxlID0gIlJNU0UgTGVhcm5pbmcgQ3VydmUiKSArCiAgdGhlbWVfbWluaW1hbCgpCgojIENyZWF0ZSBSLXNxdWFyZWQgbGVhcm5pbmcgY3VydmUKcl9zcXVhcmVkX2N1cnZlIDwtIGdncGxvdChyX3NxdWFyZWRfZGF0YSwgYWVzKHggPSBTYW1wbGVfU2l6ZSwgeSA9IFJfc3F1YXJlZCwgY29sb3IgPSBNb2RlbCkpICsKICBnZW9tX2xpbmUoKSArCiAgbGFicyh4ID0gIlNhbXBsZSBTaXplIiwgeSA9ICJSLXNxdWFyZWQiLCB0aXRsZSA9ICJSLXNxdWFyZWQgTGVhcm5pbmcgQ3VydmUiKSArCiAgdGhlbWVfbWluaW1hbCgpCgojIERpc3BsYXkgdGhlIFJNU0UgYW5kIFItc3F1YXJlZCBsZWFybmluZyBjdXJ2ZXMKcHJpbnQocm1zZV9jdXJ2ZSkKcHJpbnQocl9zcXVhcmVkX2N1cnZlKQpgYGAKCgoKQWRkIGEgbmV3IGNodW5rIGJ5IGNsaWNraW5nIHRoZSAqSW5zZXJ0IENodW5rKiBidXR0b24gb24gdGhlIHRvb2xiYXIgb3IgYnkgcHJlc3NpbmcgKkN0cmwrQWx0K0kqLgoKV2hlbiB5b3Ugc2F2ZSB0aGUgbm90ZWJvb2ssIGFuIEhUTUwgZmlsZSBjb250YWluaW5nIHRoZSBjb2RlIGFuZCBvdXRwdXQgd2lsbCBiZSBzYXZlZCBhbG9uZ3NpZGUgaXQgKGNsaWNrIHRoZSAqUHJldmlldyogYnV0dG9uIG9yIHByZXNzICpDdHJsK1NoaWZ0K0sqIHRvIHByZXZpZXcgdGhlIEhUTUwgZmlsZSkuCgpUaGUgcHJldmlldyBzaG93cyB5b3UgYSByZW5kZXJlZCBIVE1MIGNvcHkgb2YgdGhlIGNvbnRlbnRzIG9mIHRoZSBlZGl0b3IuIENvbnNlcXVlbnRseSwgdW5saWtlICpLbml0KiwgKlByZXZpZXcqIGRvZXMgbm90IHJ1biBhbnkgUiBjb2RlIGNodW5rcy4gSW5zdGVhZCwgdGhlIG91dHB1dCBvZiB0aGUgY2h1bmsgd2hlbiBpdCB3YXMgbGFzdCBydW4gaW4gdGhlIGVkaXRvciBpcyBkaXNwbGF5ZWQuCg==